blob: d27ccca23f7485509985d469916be780c95636b9 [file] [log] [blame]
niklase@google.com470e71d2011-07-07 08:21:25 +00001/*
2 * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_
12#define MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_
niklase@google.com470e71d2011-07-07 08:21:25 +000013
Yves Gerey988cc082018-10-23 12:03:01 +020014#include <stddef.h>
15#include <stdint.h>
Jonas Olssona4d87372019-07-05 19:08:33 +020016
kwiberg88788ad2016-02-19 07:04:49 -080017#include <memory>
kwiberg4a206a92016-03-31 10:24:26 -070018#include <vector>
kwiberg88788ad2016-02-19 07:04:49 -080019
Fredrik Solenbergbbf21a32018-04-12 22:44:09 +020020#include "api/audio/audio_frame.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020021#include "common_audio/channel_buffer.h"
22#include "modules/audio_processing/include/audio_processing.h"
niklase@google.com470e71d2011-07-07 08:21:25 +000023
niklase@google.com470e71d2011-07-07 08:21:25 +000024namespace webrtc {
25
Yves Gerey988cc082018-10-23 12:03:01 +020026class PushSincResampler;
27class SplittingFilter;
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +000028
Yves Gerey665174f2018-06-19 15:03:05 +020029enum Band { kBand0To8kHz = 0, kBand8To16kHz = 1, kBand16To24kHz = 2 };
aluebs@webrtc.orga7384a12014-12-03 01:06:35 +000030
Per Åhgrend47941e2019-08-22 11:51:13 +020031// Stores any audio data in a way that allows the audio processing module to
32// operate on it in a controlled manner.
niklase@google.com470e71d2011-07-07 08:21:25 +000033class AudioBuffer {
34 public:
Per Åhgren0aefbf02019-08-23 21:29:17 +020035 static const int kSplitBandSize = 160;
Per Åhgren3e8bf282019-08-29 23:38:40 +020036 static const size_t kMaxSampleRate = 384000;
Per Åhgrend47941e2019-08-22 11:51:13 +020037 AudioBuffer(size_t input_rate,
38 size_t input_num_channels,
39 size_t buffer_rate,
40 size_t buffer_num_channels,
41 size_t output_rate,
42 size_t output_num_channels);
43
44 // The constructor below will be deprecated.
Steve Antonf254e9e2019-08-21 17:52:28 +000045 AudioBuffer(size_t input_num_frames,
Per Åhgrend47941e2019-08-22 11:51:13 +020046 size_t input_num_channels,
47 size_t buffer_num_frames,
48 size_t buffer_num_channels,
Steve Antonf254e9e2019-08-21 17:52:28 +000049 size_t output_num_frames);
niklase@google.com470e71d2011-07-07 08:21:25 +000050 virtual ~AudioBuffer();
51
Per Åhgrend47941e2019-08-22 11:51:13 +020052 AudioBuffer(const AudioBuffer&) = delete;
53 AudioBuffer& operator=(const AudioBuffer&) = delete;
Per Åhgren81c0cf22019-08-21 15:02:37 +020054
Per Åhgrend47941e2019-08-22 11:51:13 +020055 // Specify that downmixing should be done by selecting a single channel.
56 void set_downmixing_to_specific_channel(size_t channel);
57
58 // Specify that downmixing should be done by averaging all channels,.
59 void set_downmixing_by_averaging();
60
61 // Set the number of channels in the buffer. The specified number of channels
62 // cannot be larger than the specified buffer_num_channels. The number is also
63 // reset at each call to CopyFrom or InterleaveFrom.
64 void set_num_channels(size_t num_channels);
65
66 size_t num_channels() const { return num_channels_; }
67 size_t num_frames() const { return buffer_num_frames_; }
68 size_t num_frames_per_band() const { return num_split_frames_; }
69 size_t num_bands() const { return num_bands_; }
70
71 // Returns pointer arrays to the full-band channels.
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000072 // Usage:
73 // channels()[channel][sample].
74 // Where:
Per Åhgrend47941e2019-08-22 11:51:13 +020075 // 0 <= channel < |buffer_num_channels_|
76 // 0 <= sample < |buffer_num_frames_|
77 float* const* channels() { return data_->channels(); }
78 const float* const* channels_const() const { return data_->channels(); }
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000079
Per Åhgrend47941e2019-08-22 11:51:13 +020080 // Returns pointer arrays to the bands for a specific channel.
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000081 // Usage:
82 // split_bands(channel)[band][sample].
83 // Where:
Per Åhgrend47941e2019-08-22 11:51:13 +020084 // 0 <= channel < |buffer_num_channels_|
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000085 // 0 <= band < |num_bands_|
86 // 0 <= sample < |num_split_frames_|
Per Åhgrend47941e2019-08-22 11:51:13 +020087 const float* const* split_bands_const(size_t channel) const {
88 return split_data_.get() ? split_data_->bands(channel)
89 : data_->bands(channel);
90 }
91 float* const* split_bands(size_t channel) {
92 return split_data_.get() ? split_data_->bands(channel)
93 : data_->bands(channel);
94 }
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000095
96 // Returns a pointer array to the channels for a specific band.
97 // Usage:
98 // split_channels(band)[channel][sample].
99 // Where:
100 // 0 <= band < |num_bands_|
Per Åhgrend47941e2019-08-22 11:51:13 +0200101 // 0 <= channel < |buffer_num_channels_|
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +0000102 // 0 <= sample < |num_split_frames_|
Per Åhgrend47941e2019-08-22 11:51:13 +0200103 const float* const* split_channels_const(Band band) const {
104 if (split_data_.get()) {
105 return split_data_->channels(band);
106 } else {
107 return band == kBand0To8kHz ? data_->channels() : nullptr;
108 }
109 }
andrew@webrtc.org755b04a2011-11-15 16:57:56 +0000110
Per Åhgrend47941e2019-08-22 11:51:13 +0200111 // Copies data into the buffer.
112 void CopyFrom(const AudioFrame* frame);
Michael Graczyk86c6d332015-07-23 11:41:39 -0700113 void CopyFrom(const float* const* data, const StreamConfig& stream_config);
Per Åhgrend47941e2019-08-22 11:51:13 +0200114
115 // Copies data from the buffer.
116 void CopyTo(AudioFrame* frame) const;
Michael Graczyk86c6d332015-07-23 11:41:39 -0700117 void CopyTo(const StreamConfig& stream_config, float* const* data);
Gustaf Ullberg422b9e02019-10-09 13:02:14 +0200118 void CopyTo(AudioBuffer* buffer) const;
niklase@google.com470e71d2011-07-07 08:21:25 +0000119
Per Åhgrend47941e2019-08-22 11:51:13 +0200120 // Splits the buffer data into frequency bands.
aluebs@webrtc.orgbe05c742014-11-14 22:18:10 +0000121 void SplitIntoFrequencyBands();
Per Åhgrend47941e2019-08-22 11:51:13 +0200122
123 // Recombines the frequency bands into a full-band signal.
aluebs@webrtc.orgbe05c742014-11-14 22:18:10 +0000124 void MergeFrequencyBands();
125
Per Åhgren928146f2019-08-20 09:19:21 +0200126 // Copies the split bands data into the integer two-dimensional array.
Per Åhgrend47941e2019-08-22 11:51:13 +0200127 void ExportSplitChannelData(size_t channel, int16_t* const* split_band_data);
Per Åhgren928146f2019-08-20 09:19:21 +0200128
129 // Copies the data in the integer two-dimensional array into the split_bands
130 // data.
Per Åhgrend47941e2019-08-22 11:51:13 +0200131 void ImportSplitChannelData(size_t channel,
132 const int16_t* const* split_band_data);
Per Åhgren928146f2019-08-20 09:19:21 +0200133
134 static const size_t kMaxSplitFrameLength = 160;
135 static const size_t kMaxNumBands = 3;
136
Per Åhgrend47941e2019-08-22 11:51:13 +0200137 // Deprecated methods, will be removed soon.
138 float* const* channels_f() { return channels(); }
139 const float* const* channels_const_f() const { return channels_const(); }
140 const float* const* split_bands_const_f(size_t channel) const {
141 return split_bands_const(channel);
142 }
143 float* const* split_bands_f(size_t channel) { return split_bands(channel); }
144 const float* const* split_channels_const_f(Band band) const {
145 return split_channels_const(band);
146 }
147 void DeinterleaveFrom(const AudioFrame* frame) { CopyFrom(frame); }
148 void InterleaveTo(AudioFrame* frame) const { CopyTo(frame); }
149
niklase@google.com470e71d2011-07-07 08:21:25 +0000150 private:
Alejandro Luebsa181c9a2016-06-30 15:33:37 -0700151 FRIEND_TEST_ALL_PREFIXES(AudioBufferTest,
152 SetNumChannelsSetsChannelBuffersNumChannels);
Per Åhgrend47941e2019-08-22 11:51:13 +0200153 void RestoreNumChannels();
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000154
Peter Kastingdce40cf2015-08-24 14:52:23 -0700155 const size_t input_num_frames_;
Per Åhgrend47941e2019-08-22 11:51:13 +0200156 const size_t input_num_channels_;
157 const size_t buffer_num_frames_;
158 const size_t buffer_num_channels_;
Peter Kastingdce40cf2015-08-24 14:52:23 -0700159 const size_t output_num_frames_;
Per Åhgrend47941e2019-08-22 11:51:13 +0200160 const size_t output_num_channels_;
Steve Antonf254e9e2019-08-21 17:52:28 +0000161
Per Åhgrend47941e2019-08-22 11:51:13 +0200162 size_t num_channels_;
Peter Kastingdce40cf2015-08-24 14:52:23 -0700163 size_t num_bands_;
164 size_t num_split_frames_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000165
Per Åhgrend47941e2019-08-22 11:51:13 +0200166 std::unique_ptr<ChannelBuffer<float>> data_;
167 std::unique_ptr<ChannelBuffer<float>> split_data_;
kwiberg88788ad2016-02-19 07:04:49 -0800168 std::unique_ptr<SplittingFilter> splitting_filter_;
kwiberg4a206a92016-03-31 10:24:26 -0700169 std::vector<std::unique_ptr<PushSincResampler>> input_resamplers_;
170 std::vector<std::unique_ptr<PushSincResampler>> output_resamplers_;
Per Åhgrend47941e2019-08-22 11:51:13 +0200171 bool downmix_by_averaging_ = true;
172 size_t channel_for_downmixing_ = 0;
niklase@google.com470e71d2011-07-07 08:21:25 +0000173};
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000174
niklase@google.com470e71d2011-07-07 08:21:25 +0000175} // namespace webrtc
176
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200177#endif // MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_