Blame - webrtc/modules/audio_coding/codecs/audio_encoder.h - webrtc.googlesource.com/src

blob: e8a2c6ea1e6d59ea70f21d1da33247e9006fe515 [file] [log] [blame]

henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	1	/*
				2	* Copyright (c) 2014 The WebRTC project authors. All Rights Reserved.
				3	*
				4	* Use of this source code is governed by a BSD-style license
				5	* that can be found in the LICENSE file in the root of the source
				6	* tree. An additional intellectual property rights grant can be found
				7	* in the file PATENTS. All contributing project authors may
				8	* be found in the AUTHORS file in the root of the source tree.
				9	*/
				10
				11	#ifndef WEBRTC_MODULES_AUDIO_CODING_CODECS_AUDIO_ENCODER_H_
				12	#define WEBRTC_MODULES_AUDIO_CODING_CODECS_AUDIO_ENCODER_H_
				13
				14	#include <algorithm>
henrik.lundin@webrtc.org	c1c9291	2014-12-16 13:41:36 +0000	[diff] [blame]	15	#include <vector>
henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	16
henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	17	#include "webrtc/typedefs.h"
				18
				19	namespace webrtc {
				20
				21	// This is the interface class for encoders in AudioCoding module. Each codec
henrik.lundin@webrtc.org	c1c9291	2014-12-16 13:41:36 +0000	[diff] [blame]	22	// type must have an implementation of this class.
henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	23	class AudioEncoder {
				24	public:
henrik.lundin@webrtc.org	c1c9291	2014-12-16 13:41:36 +0000	[diff] [blame]	25	struct EncodedInfoLeaf {
				26	EncodedInfoLeaf()
henrik.lundin@webrtc.org	bb1219e	2015-02-12 15:53:25 +0000	[diff] [blame]	27	: encoded_bytes(0),
				28	encoded_timestamp(0),
				29	payload_type(0),
henrik.lundin@webrtc.org	c86bbba	2015-03-04 16:02:42 +0000	[diff] [blame]	30	send_even_if_empty(false),
				31	speech(true) {}
henrik.lundin@webrtc.org	3b79daf	2014-12-12 13:31:24 +0000	[diff] [blame]	32
				33	size_t encoded_bytes;
henrik.lundin@webrtc.org	1db20a4	2014-12-01 14:44:50 +0000	[diff] [blame]	34	uint32_t encoded_timestamp;
henrik.lundin@webrtc.org	7f1dfa5	2014-12-02 12:08:39 +0000	[diff] [blame]	35	int payload_type;
henrik.lundin@webrtc.org	bb1219e	2015-02-12 15:53:25 +0000	[diff] [blame]	36	bool send_even_if_empty;
henrik.lundin@webrtc.org	c86bbba	2015-03-04 16:02:42 +0000	[diff] [blame]	37	bool speech;
henrik.lundin@webrtc.org	1db20a4	2014-12-01 14:44:50 +0000	[diff] [blame]	38	};
				39
henrik.lundin@webrtc.org	c1c9291	2014-12-16 13:41:36 +0000	[diff] [blame]	40	// This is the main struct for auxiliary encoding information. Each encoded
				41	// packet should be accompanied by one EncodedInfo struct, containing the
				42	// total number of \|encoded_bytes\|, the \|encoded_timestamp\| and the
				43	// \|payload_type\|. If the packet contains redundant encodings, the \|redundant\|
				44	// vector will be populated with EncodedInfoLeaf structs. Each struct in the
				45	// vector represents one encoding; the order of structs in the vector is the
				46	// same as the order in which the actual payloads are written to the byte
				47	// stream. When EncoderInfoLeaf structs are present in the vector, the main
				48	// struct's \|encoded_bytes\| will be the sum of all the \|encoded_bytes\| in the
				49	// vector.
				50	struct EncodedInfo : public EncodedInfoLeaf {
				51	EncodedInfo();
				52	~EncodedInfo();
				53
				54	std::vector<EncodedInfoLeaf> redundant;
				55	};
				56
henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	57	virtual ~AudioEncoder() {}
				58
				59	// Accepts one 10 ms block of input audio (i.e., sample_rate_hz() / 100 *
				60	// num_channels() samples). Multi-channel audio must be sample-interleaved.
jmarusic@webrtc.org	9afaee7	2015-03-19 08:50:26 +0000	[diff] [blame^]	61	// The encoder produces zero or more bytes of output in \|encoded\| and
				62	// returns additional encoding information.
jmarusic@webrtc.org	b1f0de3	2015-02-26 15:38:10 +0000	[diff] [blame]	63	// The caller is responsible for making sure that \|max_encoded_bytes\| is
				64	// not smaller than the number of bytes actually produced by the encoder.
jmarusic@webrtc.org	9afaee7	2015-03-19 08:50:26 +0000	[diff] [blame^]	65	EncodedInfo Encode(uint32_t rtp_timestamp,
				66	const int16_t* audio,
				67	size_t num_samples_per_channel,
				68	size_t max_encoded_bytes,
				69	uint8_t* encoded);
henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	70
kwiberg@webrtc.org	decd930	2014-10-29 08:38:50 +0000	[diff] [blame]	71	// Return the input sample rate in Hz and the number of input channels.
				72	// These are constants set at instantiation time.
kwiberg@webrtc.org	0521127	2015-02-18 12:00:32 +0000	[diff] [blame]	73	virtual int SampleRateHz() const = 0;
				74	virtual int NumChannels() const = 0;
kwiberg@webrtc.org	decd930	2014-10-29 08:38:50 +0000	[diff] [blame]	75
jmarusic@webrtc.org	51ccf37	2015-03-10 15:41:26 +0000	[diff] [blame]	76	// Return the maximum number of bytes that can be produced by the encoder
				77	// at each Encode() call. The caller can use the return value to determine
				78	// the size of the buffer that needs to be allocated. This value is allowed
				79	// to depend on encoder parameters like bitrate, frame size etc., so if
				80	// any of these change, the caller of Encode() is responsible for checking
				81	// that the buffer is large enough by calling MaxEncodedBytes() again.
				82	virtual size_t MaxEncodedBytes() const = 0;
				83
henrik.lundin@webrtc.org	478cedc	2015-01-27 18:24:45 +0000	[diff] [blame]	84	// Returns the rate with which the RTP timestamps are updated. By default,
				85	// this is the same as sample_rate_hz().
kwiberg@webrtc.org	0521127	2015-02-18 12:00:32 +0000	[diff] [blame]	86	virtual int RtpTimestampRateHz() const;
henrik.lundin@webrtc.org	478cedc	2015-01-27 18:24:45 +0000	[diff] [blame]	87
kwiberg@webrtc.org	decd930	2014-10-29 08:38:50 +0000	[diff] [blame]	88	// Returns the number of 10 ms frames the encoder will put in the next
				89	// packet. This value may only change when Encode() outputs a packet; i.e.,
				90	// the encoder may vary the number of 10 ms frames from packet to packet, but
				91	// it must decide the length of the next packet no later than when outputting
				92	// the preceding packet.
				93	virtual int Num10MsFramesInNextPacket() const = 0;
henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	94
henrik.lundin@webrtc.org	8911bc5	2014-12-08 21:15:55 +0000	[diff] [blame]	95	// Returns the maximum value that can be returned by
				96	// Num10MsFramesInNextPacket().
				97	virtual int Max10MsFramesInAPacket() const = 0;
				98
henrik.lundin@webrtc.org	478cedc	2015-01-27 18:24:45 +0000	[diff] [blame]	99	// Changes the target bitrate. The implementation is free to alter this value,
				100	// e.g., if the desired value is outside the valid range.
				101	virtual void SetTargetBitrate(int bits_per_second) {}
				102
				103	// Tells the implementation what the projected packet loss rate is. The rate
				104	// is in the range [0.0, 1.0]. This rate is typically used to adjust channel
				105	// coding efforts, such as FEC.
				106	virtual void SetProjectedPacketLossRate(double fraction) {}
				107
henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	108	protected:
jmarusic@webrtc.org	9afaee7	2015-03-19 08:50:26 +0000	[diff] [blame^]	109	virtual EncodedInfo EncodeInternal(uint32_t rtp_timestamp,
				110	const int16_t* audio,
				111	size_t max_encoded_bytes,
				112	uint8_t* encoded) = 0;
henrik.lundin@webrtc.org	9ea6f8a	2014-10-16 11:26:24 +0000	[diff] [blame]	113	};
				114
				115	} // namespace webrtc
				116	#endif // WEBRTC_MODULES_AUDIO_CODING_CODECS_AUDIO_ENCODER_H_