Blame - webrtc/modules/audio_coding/neteq/include/neteq.h - webrtc.googlesource.com/src

blob: d6c359b0eb96fc8c67f1f85063f835bac222e091 [file] [log] [blame]

henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	1	/*
				2	* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
				3	*
				4	* Use of this source code is governed by a BSD-style license
				5	* that can be found in the LICENSE file in the root of the source
				6	* tree. An additional intellectual property rights grant can be found
				7	* in the file PATENTS. All contributing project authors may
				8	* be found in the AUTHORS file in the root of the source tree.
				9	*/
				10
Henrik Kjellander	7464089	2015-10-29 11:31:02 +0100	[diff] [blame]	11	#ifndef WEBRTC_MODULES_AUDIO_CODING_NETEQ_INCLUDE_NETEQ_H_
				12	#define WEBRTC_MODULES_AUDIO_CODING_NETEQ_INCLUDE_NETEQ_H_
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	13
pbos@webrtc.org	12dc1a3	2013-08-05 16:22:53 +0000	[diff] [blame]	14	#include <string.h> // Provide access to size_t.
				15
Henrik Lundin	905495c	2015-05-25 16:58:41 +0200	[diff] [blame]	16	#include <string>
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	17
henrike@webrtc.org	88fbb2d	2014-05-21 21:18:46 +0000	[diff] [blame]	18	#include "webrtc/base/constructormagic.h"
sprang@webrtc.org	fe5d36b	2013-10-28 09:21:07 +0000	[diff] [blame]	19	#include "webrtc/common_types.h"
kwiberg@webrtc.org	e04a93b	2014-12-09 10:12:53 +0000	[diff] [blame]	20	#include "webrtc/modules/audio_coding/neteq/audio_decoder_impl.h"
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	21	#include "webrtc/typedefs.h"
				22
				23	namespace webrtc {
				24
				25	// Forward declarations.
				26	struct WebRtcRTPHeader;
				27
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	28	struct NetEqNetworkStatistics {
				29	uint16_t current_buffer_size_ms; // Current jitter buffer size in ms.
				30	uint16_t preferred_buffer_size_ms; // Target buffer size in ms.
				31	uint16_t jitter_peaks_found; // 1 if adding extra delay due to peaky
				32	// jitter; 0 otherwise.
				33	uint16_t packet_loss_rate; // Loss rate (network + late) in Q14.
				34	uint16_t packet_discard_rate; // Late loss rate in Q14.
				35	uint16_t expand_rate; // Fraction (of original stream) of synthesized
minyue@webrtc.org	7d721ee	2015-02-18 10:01:53 +0000	[diff] [blame]	36	// audio inserted through expansion (in Q14).
				37	uint16_t speech_expand_rate; // Fraction (of original stream) of synthesized
				38	// speech inserted through expansion (in Q14).
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	39	uint16_t preemptive_rate; // Fraction of data inserted through pre-emptive
				40	// expansion (in Q14).
				41	uint16_t accelerate_rate; // Fraction of data removed through acceleration
				42	// (in Q14).
minyue@webrtc.org	2c1bcf2	2015-02-17 10:17:09 +0000	[diff] [blame]	43	uint16_t secondary_decoded_rate; // Fraction of data coming from secondary
				44	// decoding (in Q14).
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	45	int32_t clockdrift_ppm; // Average clock-drift in parts-per-million
				46	// (positive or negative).
Peter Kasting	dce40cf	2015-08-24 14:52:23 -0700	[diff] [blame]	47	size_t added_zero_samples; // Number of zero samples added in "off" mode.
Henrik Lundin	1bb8cf8	2015-08-25 13:08:04 +0200	[diff] [blame]	48	// Statistics for packet waiting times, i.e., the time between a packet
				49	// arrives until it is decoded.
				50	int mean_waiting_time_ms;
				51	int median_waiting_time_ms;
				52	int min_waiting_time_ms;
				53	int max_waiting_time_ms;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	54	};
				55
				56	enum NetEqOutputType {
				57	kOutputNormal,
				58	kOutputPLC,
				59	kOutputCNG,
				60	kOutputPLCtoCNG,
				61	kOutputVADPassive
				62	};
				63
				64	enum NetEqPlayoutMode {
				65	kPlayoutOn,
				66	kPlayoutOff,
				67	kPlayoutFax,
				68	kPlayoutStreaming
				69	};
				70
				71	// This is the interface class for NetEq.
				72	class NetEq {
				73	public:
henrik.lundin@webrtc.org	ea25784	2014-08-07 12:27:37 +0000	[diff] [blame]	74	enum BackgroundNoiseMode {
				75	kBgnOn, // Default behavior with eternal noise.
				76	kBgnFade, // Noise fades to zero after some time.
				77	kBgnOff // Background noise is always zero.
				78	};
				79
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	80	struct Config {
				81	Config()
				82	: sample_rate_hz(16000),
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	83	enable_audio_classifier(false),
henrik.lundin	9bc2667	2015-11-02 03:25:57 -0800	[diff] [blame]	84	enable_post_decode_vad(false),
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	85	max_packets_in_buffer(50),
				86	// \|max_delay_ms\| has the same effect as calling SetMaximumDelay().
henrik.lundin@webrtc.org	ea25784	2014-08-07 12:27:37 +0000	[diff] [blame]	87	max_delay_ms(2000),
henrik.lundin@webrtc.org	7cbc4f9	2014-10-07 06:37:39 +0000	[diff] [blame]	88	background_noise_mode(kBgnOff),
Henrik Lundin	cf808d2	2015-05-27 14:33:29 +0200	[diff] [blame]	89	playout_mode(kPlayoutOn),
				90	enable_fast_accelerate(false) {}
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	91
Henrik Lundin	905495c	2015-05-25 16:58:41 +0200	[diff] [blame]	92	std::string ToString() const;
				93
Henrik Lundin	83b5c05	2015-05-08 10:33:57 +0200	[diff] [blame]	94	int sample_rate_hz; // Initial value. Will change with input data.
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	95	bool enable_audio_classifier;
henrik.lundin	9bc2667	2015-11-02 03:25:57 -0800	[diff] [blame]	96	bool enable_post_decode_vad;
Peter Kasting	dce40cf	2015-08-24 14:52:23 -0700	[diff] [blame]	97	size_t max_packets_in_buffer;
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	98	int max_delay_ms;
henrik.lundin@webrtc.org	ea25784	2014-08-07 12:27:37 +0000	[diff] [blame]	99	BackgroundNoiseMode background_noise_mode;
henrik.lundin@webrtc.org	7cbc4f9	2014-10-07 06:37:39 +0000	[diff] [blame]	100	NetEqPlayoutMode playout_mode;
Henrik Lundin	cf808d2	2015-05-27 14:33:29 +0200	[diff] [blame]	101	bool enable_fast_accelerate;
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	102	};
				103
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	104	enum ReturnCodes {
				105	kOK = 0,
				106	kFail = -1,
				107	kNotImplemented = -2
				108	};
				109
				110	enum ErrorCodes {
				111	kNoError = 0,
				112	kOtherError,
				113	kInvalidRtpPayloadType,
				114	kUnknownRtpPayloadType,
				115	kCodecNotSupported,
				116	kDecoderExists,
				117	kDecoderNotFound,
				118	kInvalidSampleRate,
				119	kInvalidPointer,
				120	kAccelerateError,
				121	kPreemptiveExpandError,
				122	kComfortNoiseErrorCode,
				123	kDecoderErrorCode,
				124	kOtherDecoderError,
				125	kInvalidOperation,
				126	kDtmfParameterError,
				127	kDtmfParsingError,
				128	kDtmfInsertError,
				129	kStereoNotSupported,
				130	kSampleUnderrun,
				131	kDecodedTooMuch,
				132	kFrameSplitError,
				133	kRedundancySplitError,
minyue@webrtc.org	7bb5436	2013-08-06 05:40:57 +0000	[diff] [blame]	134	kPacketBufferCorruption,
turaj@webrtc.org	7b75ac6	2013-09-26 00:27:56 +0000	[diff] [blame]	135	kSyncPacketNotAccepted
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	136	};
				137
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	138	// Creates a new NetEq object, with parameters set in \|config\|. The \|config\|
				139	// object will only have to be valid for the duration of the call to this
				140	// method.
				141	static NetEq* Create(const NetEq::Config& config);
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	142
				143	virtual ~NetEq() {}
				144
				145	// Inserts a new packet into NetEq. The \|receive_timestamp\| is an indication
				146	// of the time when the packet was received, and should be measured with
				147	// the same tick rate as the RTP timestamp of the current payload.
				148	// Returns 0 on success, -1 on failure.
				149	virtual int InsertPacket(const WebRtcRTPHeader& rtp_header,
				150	const uint8_t* payload,
pkasting@chromium.org	4591fbd	2014-11-20 22:28:14 +0000	[diff] [blame]	151	size_t length_bytes,
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	152	uint32_t receive_timestamp) = 0;
				153
turaj@webrtc.org	7b75ac6	2013-09-26 00:27:56 +0000	[diff] [blame]	154	// Inserts a sync-packet into packet queue. Sync-packets are decoded to
				155	// silence and are intended to keep AV-sync intact in an event of long packet
				156	// losses when Video NACK is enabled but Audio NACK is not. Clients of NetEq
				157	// might insert sync-packet when they observe that buffer level of NetEq is
				158	// decreasing below a certain threshold, defined by the application.
				159	// Sync-packets should have the same payload type as the last audio payload
				160	// type, i.e. they cannot have DTMF or CNG payload type, nor a codec change
				161	// can be implied by inserting a sync-packet.
				162	// Returns kOk on success, kFail on failure.
				163	virtual int InsertSyncPacket(const WebRtcRTPHeader& rtp_header,
				164	uint32_t receive_timestamp) = 0;
				165
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	166	// Instructs NetEq to deliver 10 ms of audio data. The data is written to
				167	// \|output_audio\|, which can hold (at least) \|max_length\| elements.
				168	// The number of channels that were written to the output is provided in
				169	// the output variable \|num_channels\|, and each channel contains
				170	// \|samples_per_channel\| elements. If more than one channel is written,
				171	// the samples are interleaved.
				172	// The speech type is written to \|type\|, if \|type\| is not NULL.
				173	// Returns kOK on success, or kFail in case of an error.
				174	virtual int GetAudio(size_t max_length, int16_t* output_audio,
Peter Kasting	dce40cf	2015-08-24 14:52:23 -0700	[diff] [blame]	175	size_t* samples_per_channel, int* num_channels,
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	176	NetEqOutputType* type) = 0;
				177
				178	// Associates \|rtp_payload_type\| with \|codec\| and stores the information in
				179	// the codec database. Returns 0 on success, -1 on failure.
kwiberg	ee1879c	2015-10-29 06:20:28 -0700	[diff] [blame]	180	virtual int RegisterPayloadType(NetEqDecoder codec,
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	181	uint8_t rtp_payload_type) = 0;
				182
				183	// Provides an externally created decoder object \|decoder\| to insert in the
				184	// decoder database. The decoder implements a decoder of type \|codec\| and
Karl Wiberg	d8399e6	2015-05-25 14:39:56 +0200	[diff] [blame]	185	// associates it with \|rtp_payload_type\|. The decoder will produce samples
				186	// at the rate \|sample_rate_hz\|. Returns kOK on success, kFail on failure.
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	187	virtual int RegisterExternalDecoder(AudioDecoder* decoder,
kwiberg	ee1879c	2015-10-29 06:20:28 -0700	[diff] [blame]	188	NetEqDecoder codec,
Karl Wiberg	d8399e6	2015-05-25 14:39:56 +0200	[diff] [blame]	189	uint8_t rtp_payload_type,
				190	int sample_rate_hz) = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	191
				192	// Removes \|rtp_payload_type\| from the codec database. Returns 0 on success,
				193	// -1 on failure.
				194	virtual int RemovePayloadType(uint8_t rtp_payload_type) = 0;
				195
turaj@webrtc.org	f1efc57	2013-08-16 23:44:24 +0000	[diff] [blame]	196	// Sets a minimum delay in millisecond for packet buffer. The minimum is
				197	// maintained unless a higher latency is dictated by channel condition.
				198	// Returns true if the minimum is successfully applied, otherwise false is
				199	// returned.
				200	virtual bool SetMinimumDelay(int delay_ms) = 0;
				201
				202	// Sets a maximum delay in milliseconds for packet buffer. The latency will
				203	// not exceed the given value, even required delay (given the channel
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	204	// conditions) is higher. Calling this method has the same effect as setting
				205	// the \|max_delay_ms\| value in the NetEq::Config struct.
turaj@webrtc.org	f1efc57	2013-08-16 23:44:24 +0000	[diff] [blame]	206	virtual bool SetMaximumDelay(int delay_ms) = 0;
				207
				208	// The smallest latency required. This is computed bases on inter-arrival
				209	// time and internal NetEq logic. Note that in computing this latency none of
				210	// the user defined limits (applied by calling setMinimumDelay() and/or
				211	// SetMaximumDelay()) are applied.
				212	virtual int LeastRequiredDelayMs() const = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	213
				214	// Not implemented.
				215	virtual int SetTargetDelay() = 0;
				216
				217	// Not implemented.
				218	virtual int TargetDelay() = 0;
				219
henrik.lundin	9c3efd0	2015-08-27 13:12:22 -0700	[diff] [blame]	220	// Returns the current total delay (packet buffer and sync buffer) in ms.
				221	virtual int CurrentDelayMs() const = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	222
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	223	// Sets the playout mode to \|mode\|.
henrik.lundin@webrtc.org	7cbc4f9	2014-10-07 06:37:39 +0000	[diff] [blame]	224	// Deprecated. Set the mode in the Config struct passed to the constructor.
				225	// TODO(henrik.lundin) Delete.
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	226	virtual void SetPlayoutMode(NetEqPlayoutMode mode) = 0;
				227
				228	// Returns the current playout mode.
henrik.lundin@webrtc.org	7cbc4f9	2014-10-07 06:37:39 +0000	[diff] [blame]	229	// Deprecated.
				230	// TODO(henrik.lundin) Delete.
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	231	virtual NetEqPlayoutMode PlayoutMode() const = 0;
				232
				233	// Writes the current network statistics to \|stats\|. The statistics are reset
				234	// after the call.
				235	virtual int NetworkStatistics(NetEqNetworkStatistics* stats) = 0;
				236
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	237	// Writes the current RTCP statistics to \|stats\|. The statistics are reset
				238	// and a new report period is started with the call.
				239	virtual void GetRtcpStatistics(RtcpStatistics* stats) = 0;
				240
				241	// Same as RtcpStatistics(), but does not reset anything.
				242	virtual void GetRtcpStatisticsNoReset(RtcpStatistics* stats) = 0;
				243
				244	// Enables post-decode VAD. When enabled, GetAudio() will return
				245	// kOutputVADPassive when the signal contains no speech.
				246	virtual void EnableVad() = 0;
				247
				248	// Disables post-decode VAD.
				249	virtual void DisableVad() = 0;
				250
wu@webrtc.org	94454b7	2014-06-05 20:34:08 +0000	[diff] [blame]	251	// Gets the RTP timestamp for the last sample delivered by GetAudio().
				252	// Returns true if the RTP timestamp is valid, otherwise false.
				253	virtual bool GetPlayoutTimestamp(uint32_t* timestamp) = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	254
				255	// Not implemented.
				256	virtual int SetTargetNumberOfChannels() = 0;
				257
				258	// Not implemented.
				259	virtual int SetTargetSampleRate() = 0;
				260
				261	// Returns the error code for the last occurred error. If no error has
				262	// occurred, 0 is returned.
henrik.lundin@webrtc.org	b0f4b3d	2014-11-04 08:53:10 +0000	[diff] [blame]	263	virtual int LastError() const = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	264
				265	// Returns the error code last returned by a decoder (audio or comfort noise).
				266	// When LastError() returns kDecoderErrorCode or kComfortNoiseErrorCode, check
				267	// this method to get the decoder's error code.
				268	virtual int LastDecoderError() = 0;
				269
				270	// Flushes both the packet buffer and the sync buffer.
				271	virtual void FlushBuffers() = 0;
				272
turaj@webrtc.org	7df9706	2013-08-02 18:07:13 +0000	[diff] [blame]	273	// Current usage of packet-buffer and it's limits.
				274	virtual void PacketBufferStatistics(int* current_num_packets,
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	275	int* max_num_packets) const = 0;
turaj@webrtc.org	7df9706	2013-08-02 18:07:13 +0000	[diff] [blame]	276
henrik.lundin	48ed930	2015-10-29 05:36:24 -0700	[diff] [blame]	277	// Enables NACK and sets the maximum size of the NACK list, which should be
				278	// positive and no larger than Nack::kNackListSizeLimit. If NACK is already
				279	// enabled then the maximum NACK list size is modified accordingly.
				280	virtual void EnableNack(size_t max_nack_list_size) = 0;
				281
				282	virtual void DisableNack() = 0;
				283
				284	// Returns a list of RTP sequence numbers corresponding to packets to be
				285	// retransmitted, given an estimate of the round-trip time in milliseconds.
				286	virtual std::vector<uint16_t> GetNackList(
				287	int64_t round_trip_time_ms) const = 0;
minyue@webrtc.org	d730177	2013-08-29 00:58:14 +0000	[diff] [blame]	288
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	289	protected:
				290	NetEq() {}
				291
				292	private:
henrikg	3c089d7	2015-09-16 05:37:44 -0700	[diff] [blame]	293	RTC_DISALLOW_COPY_AND_ASSIGN(NetEq);
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	294	};
				295
				296	} // namespace webrtc
Henrik Kjellander	7464089	2015-10-29 11:31:02 +0100	[diff] [blame]	297	#endif // WEBRTC_MODULES_AUDIO_CODING_NETEQ_INCLUDE_NETEQ_H_