Blame - webrtc/modules/audio_coding/neteq/include/neteq.h - webrtc.googlesource.com/src

blob: fd1041a1ea3cf13a7053a7605f0693266e8d5cb5 [file] [log] [blame]

henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	1	/*
				2	* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
				3	*
				4	* Use of this source code is governed by a BSD-style license
				5	* that can be found in the LICENSE file in the root of the source
				6	* tree. An additional intellectual property rights grant can be found
				7	* in the file PATENTS. All contributing project authors may
				8	* be found in the AUTHORS file in the root of the source tree.
				9	*/
				10
Henrik Kjellander	7464089	2015-10-29 11:31:02 +0100	[diff] [blame]	11	#ifndef WEBRTC_MODULES_AUDIO_CODING_NETEQ_INCLUDE_NETEQ_H_
				12	#define WEBRTC_MODULES_AUDIO_CODING_NETEQ_INCLUDE_NETEQ_H_
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	13
pbos@webrtc.org	12dc1a3	2013-08-05 16:22:53 +0000	[diff] [blame]	14	#include <string.h> // Provide access to size_t.
				15
Henrik Lundin	905495c	2015-05-25 16:58:41 +0200	[diff] [blame]	16	#include <string>
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	17
henrike@webrtc.org	88fbb2d	2014-05-21 21:18:46 +0000	[diff] [blame]	18	#include "webrtc/base/constructormagic.h"
henrik.lundin	9a410dd	2016-04-06 01:39:22 -0700	[diff] [blame]	19	#include "webrtc/base/optional.h"
ossu	e352578	2016-05-25 07:37:43 -0700	[diff] [blame^]	20	#include "webrtc/base/scoped_ref_ptr.h"
sprang@webrtc.org	fe5d36b	2013-10-28 09:21:07 +0000	[diff] [blame]	21	#include "webrtc/common_types.h"
kwiberg@webrtc.org	e04a93b	2014-12-09 10:12:53 +0000	[diff] [blame]	22	#include "webrtc/modules/audio_coding/neteq/audio_decoder_impl.h"
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	23	#include "webrtc/typedefs.h"
				24
				25	namespace webrtc {
				26
				27	// Forward declarations.
henrik.lundin	6d8e011	2016-03-04 10:34:21 -0800	[diff] [blame]	28	class AudioFrame;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	29	struct WebRtcRTPHeader;
ossu	e352578	2016-05-25 07:37:43 -0700	[diff] [blame^]	30	class AudioDecoderFactory;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	31
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	32	struct NetEqNetworkStatistics {
				33	uint16_t current_buffer_size_ms; // Current jitter buffer size in ms.
				34	uint16_t preferred_buffer_size_ms; // Target buffer size in ms.
				35	uint16_t jitter_peaks_found; // 1 if adding extra delay due to peaky
				36	// jitter; 0 otherwise.
				37	uint16_t packet_loss_rate; // Loss rate (network + late) in Q14.
				38	uint16_t packet_discard_rate; // Late loss rate in Q14.
				39	uint16_t expand_rate; // Fraction (of original stream) of synthesized
minyue@webrtc.org	7d721ee	2015-02-18 10:01:53 +0000	[diff] [blame]	40	// audio inserted through expansion (in Q14).
				41	uint16_t speech_expand_rate; // Fraction (of original stream) of synthesized
				42	// speech inserted through expansion (in Q14).
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	43	uint16_t preemptive_rate; // Fraction of data inserted through pre-emptive
				44	// expansion (in Q14).
				45	uint16_t accelerate_rate; // Fraction of data removed through acceleration
				46	// (in Q14).
minyue@webrtc.org	2c1bcf2	2015-02-17 10:17:09 +0000	[diff] [blame]	47	uint16_t secondary_decoded_rate; // Fraction of data coming from secondary
				48	// decoding (in Q14).
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	49	int32_t clockdrift_ppm; // Average clock-drift in parts-per-million
				50	// (positive or negative).
Peter Kasting	dce40cf	2015-08-24 14:52:23 -0700	[diff] [blame]	51	size_t added_zero_samples; // Number of zero samples added in "off" mode.
Henrik Lundin	1bb8cf8	2015-08-25 13:08:04 +0200	[diff] [blame]	52	// Statistics for packet waiting times, i.e., the time between a packet
				53	// arrives until it is decoded.
				54	int mean_waiting_time_ms;
				55	int median_waiting_time_ms;
				56	int min_waiting_time_ms;
				57	int max_waiting_time_ms;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	58	};
				59
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	60	enum NetEqPlayoutMode {
				61	kPlayoutOn,
				62	kPlayoutOff,
				63	kPlayoutFax,
				64	kPlayoutStreaming
				65	};
				66
				67	// This is the interface class for NetEq.
				68	class NetEq {
				69	public:
henrik.lundin@webrtc.org	ea25784	2014-08-07 12:27:37 +0000	[diff] [blame]	70	enum BackgroundNoiseMode {
				71	kBgnOn, // Default behavior with eternal noise.
				72	kBgnFade, // Noise fades to zero after some time.
				73	kBgnOff // Background noise is always zero.
				74	};
				75
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	76	struct Config {
				77	Config()
				78	: sample_rate_hz(16000),
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	79	enable_audio_classifier(false),
henrik.lundin	9bc2667	2015-11-02 03:25:57 -0800	[diff] [blame]	80	enable_post_decode_vad(false),
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	81	max_packets_in_buffer(50),
				82	// \|max_delay_ms\| has the same effect as calling SetMaximumDelay().
henrik.lundin@webrtc.org	ea25784	2014-08-07 12:27:37 +0000	[diff] [blame]	83	max_delay_ms(2000),
henrik.lundin@webrtc.org	7cbc4f9	2014-10-07 06:37:39 +0000	[diff] [blame]	84	background_noise_mode(kBgnOff),
Henrik Lundin	cf808d2	2015-05-27 14:33:29 +0200	[diff] [blame]	85	playout_mode(kPlayoutOn),
				86	enable_fast_accelerate(false) {}
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	87
Henrik Lundin	905495c	2015-05-25 16:58:41 +0200	[diff] [blame]	88	std::string ToString() const;
				89
Henrik Lundin	83b5c05	2015-05-08 10:33:57 +0200	[diff] [blame]	90	int sample_rate_hz; // Initial value. Will change with input data.
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	91	bool enable_audio_classifier;
henrik.lundin	9bc2667	2015-11-02 03:25:57 -0800	[diff] [blame]	92	bool enable_post_decode_vad;
Peter Kasting	dce40cf	2015-08-24 14:52:23 -0700	[diff] [blame]	93	size_t max_packets_in_buffer;
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	94	int max_delay_ms;
henrik.lundin@webrtc.org	ea25784	2014-08-07 12:27:37 +0000	[diff] [blame]	95	BackgroundNoiseMode background_noise_mode;
henrik.lundin@webrtc.org	7cbc4f9	2014-10-07 06:37:39 +0000	[diff] [blame]	96	NetEqPlayoutMode playout_mode;
Henrik Lundin	cf808d2	2015-05-27 14:33:29 +0200	[diff] [blame]	97	bool enable_fast_accelerate;
henrik.lundin	7a92681	2016-05-12 13:51:28 -0700	[diff] [blame]	98	bool enable_muted_state = false;
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	99	};
				100
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	101	enum ReturnCodes {
				102	kOK = 0,
				103	kFail = -1,
				104	kNotImplemented = -2
				105	};
				106
				107	enum ErrorCodes {
				108	kNoError = 0,
				109	kOtherError,
				110	kInvalidRtpPayloadType,
				111	kUnknownRtpPayloadType,
				112	kCodecNotSupported,
				113	kDecoderExists,
				114	kDecoderNotFound,
				115	kInvalidSampleRate,
				116	kInvalidPointer,
				117	kAccelerateError,
				118	kPreemptiveExpandError,
				119	kComfortNoiseErrorCode,
				120	kDecoderErrorCode,
				121	kOtherDecoderError,
				122	kInvalidOperation,
				123	kDtmfParameterError,
				124	kDtmfParsingError,
				125	kDtmfInsertError,
				126	kStereoNotSupported,
				127	kSampleUnderrun,
				128	kDecodedTooMuch,
				129	kFrameSplitError,
				130	kRedundancySplitError,
minyue@webrtc.org	7bb5436	2013-08-06 05:40:57 +0000	[diff] [blame]	131	kPacketBufferCorruption,
turaj@webrtc.org	7b75ac6	2013-09-26 00:27:56 +0000	[diff] [blame]	132	kSyncPacketNotAccepted
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	133	};
				134
henrik.lundin@webrtc.org	35ead38	2014-04-14 18:49:17 +0000	[diff] [blame]	135	// Creates a new NetEq object, with parameters set in \|config\|. The \|config\|
				136	// object will only have to be valid for the duration of the call to this
				137	// method.
ossu	e352578	2016-05-25 07:37:43 -0700	[diff] [blame^]	138	static NetEq* Create(
				139	const NetEq::Config& config,
				140	const rtc::scoped_refptr<AudioDecoderFactory>& decoder_factory);
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	141
				142	virtual ~NetEq() {}
				143
				144	// Inserts a new packet into NetEq. The \|receive_timestamp\| is an indication
				145	// of the time when the packet was received, and should be measured with
				146	// the same tick rate as the RTP timestamp of the current payload.
				147	// Returns 0 on success, -1 on failure.
				148	virtual int InsertPacket(const WebRtcRTPHeader& rtp_header,
kwiberg	ee2bac2	2015-11-11 10:34:00 -0800	[diff] [blame]	149	rtc::ArrayView<const uint8_t> payload,
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	150	uint32_t receive_timestamp) = 0;
				151
turaj@webrtc.org	7b75ac6	2013-09-26 00:27:56 +0000	[diff] [blame]	152	// Inserts a sync-packet into packet queue. Sync-packets are decoded to
				153	// silence and are intended to keep AV-sync intact in an event of long packet
				154	// losses when Video NACK is enabled but Audio NACK is not. Clients of NetEq
				155	// might insert sync-packet when they observe that buffer level of NetEq is
				156	// decreasing below a certain threshold, defined by the application.
				157	// Sync-packets should have the same payload type as the last audio payload
				158	// type, i.e. they cannot have DTMF or CNG payload type, nor a codec change
				159	// can be implied by inserting a sync-packet.
				160	// Returns kOk on success, kFail on failure.
				161	virtual int InsertSyncPacket(const WebRtcRTPHeader& rtp_header,
				162	uint32_t receive_timestamp) = 0;
				163
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	164	// Instructs NetEq to deliver 10 ms of audio data. The data is written to
henrik.lundin	7dc6889	2016-04-06 01:03:02 -0700	[diff] [blame]	165	// \|audio_frame\|. All data in \|audio_frame\| is wiped; \|data_\|, \|speech_type_\|,
				166	// \|num_channels_\|, \|sample_rate_hz_\|, \|samples_per_channel_\|, and
henrik.lundin	55480f5	2016-03-08 02:37:57 -0800	[diff] [blame]	167	// \|vad_activity_\| are updated upon success. If an error is returned, some
				168	// fields may not have been updated.
henrik.lundin	7a92681	2016-05-12 13:51:28 -0700	[diff] [blame]	169	// If muted state is enabled (through Config::enable_muted_state), \|muted\|
				170	// may be set to true after a prolonged expand period. When this happens, the
				171	// \|data_\| in \|audio_frame\| is not written, but should be interpreted as being
				172	// all zeros.
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	173	// Returns kOK on success, or kFail in case of an error.
henrik.lundin	7a92681	2016-05-12 13:51:28 -0700	[diff] [blame]	174	virtual int GetAudio(AudioFrame* audio_frame, bool* muted) = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	175
henrik.lundin	4cf61dd	2015-12-09 06:20:58 -0800	[diff] [blame]	176	// Associates \|rtp_payload_type\| with \|codec\| and \|codec_name\|, and stores the
				177	// information in the codec database. Returns 0 on success, -1 on failure.
				178	// The name is only used to provide information back to the caller about the
				179	// decoders. Hence, the name is arbitrary, and may be empty.
kwiberg	ee1879c	2015-10-29 06:20:28 -0700	[diff] [blame]	180	virtual int RegisterPayloadType(NetEqDecoder codec,
henrik.lundin	4cf61dd	2015-12-09 06:20:58 -0800	[diff] [blame]	181	const std::string& codec_name,
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	182	uint8_t rtp_payload_type) = 0;
				183
				184	// Provides an externally created decoder object \|decoder\| to insert in the
				185	// decoder database. The decoder implements a decoder of type \|codec\| and
henrik.lundin	4cf61dd	2015-12-09 06:20:58 -0800	[diff] [blame]	186	// associates it with \|rtp_payload_type\| and \|codec_name\|. The decoder will
				187	// produce samples at the rate \|sample_rate_hz\|. Returns kOK on success, kFail
				188	// on failure.
				189	// The name is only used to provide information back to the caller about the
				190	// decoders. Hence, the name is arbitrary, and may be empty.
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	191	virtual int RegisterExternalDecoder(AudioDecoder* decoder,
kwiberg	ee1879c	2015-10-29 06:20:28 -0700	[diff] [blame]	192	NetEqDecoder codec,
henrik.lundin	4cf61dd	2015-12-09 06:20:58 -0800	[diff] [blame]	193	const std::string& codec_name,
Karl Wiberg	d8399e6	2015-05-25 14:39:56 +0200	[diff] [blame]	194	uint8_t rtp_payload_type,
				195	int sample_rate_hz) = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	196
				197	// Removes \|rtp_payload_type\| from the codec database. Returns 0 on success,
				198	// -1 on failure.
				199	virtual int RemovePayloadType(uint8_t rtp_payload_type) = 0;
				200
turaj@webrtc.org	f1efc57	2013-08-16 23:44:24 +0000	[diff] [blame]	201	// Sets a minimum delay in millisecond for packet buffer. The minimum is
				202	// maintained unless a higher latency is dictated by channel condition.
				203	// Returns true if the minimum is successfully applied, otherwise false is
				204	// returned.
				205	virtual bool SetMinimumDelay(int delay_ms) = 0;
				206
				207	// Sets a maximum delay in milliseconds for packet buffer. The latency will
				208	// not exceed the given value, even required delay (given the channel
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	209	// conditions) is higher. Calling this method has the same effect as setting
				210	// the \|max_delay_ms\| value in the NetEq::Config struct.
turaj@webrtc.org	f1efc57	2013-08-16 23:44:24 +0000	[diff] [blame]	211	virtual bool SetMaximumDelay(int delay_ms) = 0;
				212
				213	// The smallest latency required. This is computed bases on inter-arrival
				214	// time and internal NetEq logic. Note that in computing this latency none of
				215	// the user defined limits (applied by calling setMinimumDelay() and/or
				216	// SetMaximumDelay()) are applied.
				217	virtual int LeastRequiredDelayMs() const = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	218
				219	// Not implemented.
				220	virtual int SetTargetDelay() = 0;
				221
				222	// Not implemented.
				223	virtual int TargetDelay() = 0;
				224
henrik.lundin	9c3efd0	2015-08-27 13:12:22 -0700	[diff] [blame]	225	// Returns the current total delay (packet buffer and sync buffer) in ms.
				226	virtual int CurrentDelayMs() const = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	227
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	228	// Sets the playout mode to \|mode\|.
henrik.lundin@webrtc.org	7cbc4f9	2014-10-07 06:37:39 +0000	[diff] [blame]	229	// Deprecated. Set the mode in the Config struct passed to the constructor.
				230	// TODO(henrik.lundin) Delete.
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	231	virtual void SetPlayoutMode(NetEqPlayoutMode mode) = 0;
				232
				233	// Returns the current playout mode.
henrik.lundin@webrtc.org	7cbc4f9	2014-10-07 06:37:39 +0000	[diff] [blame]	234	// Deprecated.
				235	// TODO(henrik.lundin) Delete.
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	236	virtual NetEqPlayoutMode PlayoutMode() const = 0;
				237
				238	// Writes the current network statistics to \|stats\|. The statistics are reset
				239	// after the call.
				240	virtual int NetworkStatistics(NetEqNetworkStatistics* stats) = 0;
				241
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	242	// Writes the current RTCP statistics to \|stats\|. The statistics are reset
				243	// and a new report period is started with the call.
				244	virtual void GetRtcpStatistics(RtcpStatistics* stats) = 0;
				245
				246	// Same as RtcpStatistics(), but does not reset anything.
				247	virtual void GetRtcpStatisticsNoReset(RtcpStatistics* stats) = 0;
				248
				249	// Enables post-decode VAD. When enabled, GetAudio() will return
				250	// kOutputVADPassive when the signal contains no speech.
				251	virtual void EnableVad() = 0;
				252
				253	// Disables post-decode VAD.
				254	virtual void DisableVad() = 0;
				255
henrik.lundin	9a410dd	2016-04-06 01:39:22 -0700	[diff] [blame]	256	// Returns the RTP timestamp for the last sample delivered by GetAudio().
				257	// The return value will be empty if no valid timestamp is available.
henrik.lundin	15c51e3	2016-04-06 08:38:56 -0700	[diff] [blame]	258	virtual rtc::Optional<uint32_t> GetPlayoutTimestamp() const = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	259
henrik.lundin	d89814b	2015-11-23 06:49:25 -0800	[diff] [blame]	260	// Returns the sample rate in Hz of the audio produced in the last GetAudio
				261	// call. If GetAudio has not been called yet, the configured sample rate
				262	// (Config::sample_rate_hz) is returned.
				263	virtual int last_output_sample_rate_hz() const = 0;
				264
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	265	// Not implemented.
				266	virtual int SetTargetNumberOfChannels() = 0;
				267
				268	// Not implemented.
				269	virtual int SetTargetSampleRate() = 0;
				270
				271	// Returns the error code for the last occurred error. If no error has
				272	// occurred, 0 is returned.
henrik.lundin@webrtc.org	b0f4b3d	2014-11-04 08:53:10 +0000	[diff] [blame]	273	virtual int LastError() const = 0;
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	274
				275	// Returns the error code last returned by a decoder (audio or comfort noise).
				276	// When LastError() returns kDecoderErrorCode or kComfortNoiseErrorCode, check
				277	// this method to get the decoder's error code.
				278	virtual int LastDecoderError() = 0;
				279
				280	// Flushes both the packet buffer and the sync buffer.
				281	virtual void FlushBuffers() = 0;
				282
turaj@webrtc.org	7df9706	2013-08-02 18:07:13 +0000	[diff] [blame]	283	// Current usage of packet-buffer and it's limits.
				284	virtual void PacketBufferStatistics(int* current_num_packets,
henrik.lundin@webrtc.org	116ed1d	2014-04-28 08:20:04 +0000	[diff] [blame]	285	int* max_num_packets) const = 0;
turaj@webrtc.org	7df9706	2013-08-02 18:07:13 +0000	[diff] [blame]	286
henrik.lundin	48ed930	2015-10-29 05:36:24 -0700	[diff] [blame]	287	// Enables NACK and sets the maximum size of the NACK list, which should be
				288	// positive and no larger than Nack::kNackListSizeLimit. If NACK is already
				289	// enabled then the maximum NACK list size is modified accordingly.
				290	virtual void EnableNack(size_t max_nack_list_size) = 0;
				291
				292	virtual void DisableNack() = 0;
				293
				294	// Returns a list of RTP sequence numbers corresponding to packets to be
				295	// retransmitted, given an estimate of the round-trip time in milliseconds.
				296	virtual std::vector<uint16_t> GetNackList(
				297	int64_t round_trip_time_ms) const = 0;
minyue@webrtc.org	d730177	2013-08-29 00:58:14 +0000	[diff] [blame]	298
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	299	protected:
				300	NetEq() {}
				301
				302	private:
henrikg	3c089d7	2015-09-16 05:37:44 -0700	[diff] [blame]	303	RTC_DISALLOW_COPY_AND_ASSIGN(NetEq);
henrik.lundin@webrtc.org	d94659d	2013-01-29 12:09:21 +0000	[diff] [blame]	304	};
				305
				306	} // namespace webrtc
Henrik Kjellander	7464089	2015-10-29 11:31:02 +0100	[diff] [blame]	307	#endif // WEBRTC_MODULES_AUDIO_CODING_NETEQ_INCLUDE_NETEQ_H_