niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #ifndef MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_ |
| 12 | #define MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_ |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 13 | |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 14 | #include <stddef.h> |
| 15 | #include <stdint.h> |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 16 | |
kwiberg | 88788ad | 2016-02-19 07:04:49 -0800 | [diff] [blame] | 17 | #include <memory> |
kwiberg | 4a206a9 | 2016-03-31 10:24:26 -0700 | [diff] [blame] | 18 | #include <vector> |
kwiberg | 88788ad | 2016-02-19 07:04:49 -0800 | [diff] [blame] | 19 | |
Fredrik Solenberg | bbf21a3 | 2018-04-12 22:44:09 +0200 | [diff] [blame] | 20 | #include "api/audio/audio_frame.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 21 | #include "common_audio/channel_buffer.h" |
| 22 | #include "modules/audio_processing/include/audio_processing.h" |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 23 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 24 | namespace webrtc { |
| 25 | |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 26 | class PushSincResampler; |
| 27 | class SplittingFilter; |
andrew@webrtc.org | ddbb8a2 | 2014-04-22 21:00:04 +0000 | [diff] [blame] | 28 | |
// Identifies one frequency band of a band-split signal. The enumerator values
// are passed on as band indices (see AudioBuffer::split_channels_const()), so
// they must stay contiguous and start at zero.
enum Band {
  kBand0To8kHz = 0,    // Lowest band.
  kBand8To16kHz = 1,   // Middle band.
  kBand16To24kHz = 2   // Highest band.
};
aluebs@webrtc.org | a7384a1 | 2014-12-03 01:06:35 +0000 | [diff] [blame] | 30 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 31 | // Stores any audio data in a way that allows the audio processing module to |
| 32 | // operate on it in a controlled manner. |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 33 | class AudioBuffer { |
| 34 | public: |
Per Åhgren | 0aefbf0 | 2019-08-23 21:29:17 +0200 | [diff] [blame^] | 35 | static const int kSplitBandSize = 160; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 36 | AudioBuffer(size_t input_rate, |
| 37 | size_t input_num_channels, |
| 38 | size_t buffer_rate, |
| 39 | size_t buffer_num_channels, |
| 40 | size_t output_rate, |
| 41 | size_t output_num_channels); |
| 42 | |
| 43 | // The constructor below will be deprecated. |
Steve Anton | f254e9e | 2019-08-21 17:52:28 +0000 | [diff] [blame] | 44 | AudioBuffer(size_t input_num_frames, |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 45 | size_t input_num_channels, |
| 46 | size_t buffer_num_frames, |
| 47 | size_t buffer_num_channels, |
Steve Anton | f254e9e | 2019-08-21 17:52:28 +0000 | [diff] [blame] | 48 | size_t output_num_frames); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 49 | virtual ~AudioBuffer(); |
| 50 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 51 | AudioBuffer(const AudioBuffer&) = delete; |
| 52 | AudioBuffer& operator=(const AudioBuffer&) = delete; |
Per Åhgren | 81c0cf2 | 2019-08-21 15:02:37 +0200 | [diff] [blame] | 53 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 54 | // Specify that downmixing should be done by selecting a single channel. |
| 55 | void set_downmixing_to_specific_channel(size_t channel); |
| 56 | |
| 57 | // Specify that downmixing should be done by averaging all channels,. |
| 58 | void set_downmixing_by_averaging(); |
| 59 | |
| 60 | // Set the number of channels in the buffer. The specified number of channels |
| 61 | // cannot be larger than the specified buffer_num_channels. The number is also |
| 62 | // reset at each call to CopyFrom or InterleaveFrom. |
| 63 | void set_num_channels(size_t num_channels); |
| 64 | |
| 65 | size_t num_channels() const { return num_channels_; } |
| 66 | size_t num_frames() const { return buffer_num_frames_; } |
| 67 | size_t num_frames_per_band() const { return num_split_frames_; } |
| 68 | size_t num_bands() const { return num_bands_; } |
| 69 | |
| 70 | // Returns pointer arrays to the full-band channels. |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 71 | // Usage: |
| 72 | // channels()[channel][sample]. |
| 73 | // Where: |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 74 | // 0 <= channel < |buffer_num_channels_| |
| 75 | // 0 <= sample < |buffer_num_frames_| |
| 76 | float* const* channels() { return data_->channels(); } |
| 77 | const float* const* channels_const() const { return data_->channels(); } |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 78 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 79 | // Returns pointer arrays to the bands for a specific channel. |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 80 | // Usage: |
| 81 | // split_bands(channel)[band][sample]. |
| 82 | // Where: |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 83 | // 0 <= channel < |buffer_num_channels_| |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 84 | // 0 <= band < |num_bands_| |
| 85 | // 0 <= sample < |num_split_frames_| |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 86 | const float* const* split_bands_const(size_t channel) const { |
| 87 | return split_data_.get() ? split_data_->bands(channel) |
| 88 | : data_->bands(channel); |
| 89 | } |
| 90 | float* const* split_bands(size_t channel) { |
| 91 | return split_data_.get() ? split_data_->bands(channel) |
| 92 | : data_->bands(channel); |
| 93 | } |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 94 | |
| 95 | // Returns a pointer array to the channels for a specific band. |
| 96 | // Usage: |
| 97 | // split_channels(band)[channel][sample]. |
| 98 | // Where: |
| 99 | // 0 <= band < |num_bands_| |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 100 | // 0 <= channel < |buffer_num_channels_| |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 101 | // 0 <= sample < |num_split_frames_| |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 102 | const float* const* split_channels_const(Band band) const { |
| 103 | if (split_data_.get()) { |
| 104 | return split_data_->channels(band); |
| 105 | } else { |
| 106 | return band == kBand0To8kHz ? data_->channels() : nullptr; |
| 107 | } |
| 108 | } |
andrew@webrtc.org | 755b04a | 2011-11-15 16:57:56 +0000 | [diff] [blame] | 109 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 110 | // Copies data into the buffer. |
| 111 | void CopyFrom(const AudioFrame* frame); |
Michael Graczyk | 86c6d33 | 2015-07-23 11:41:39 -0700 | [diff] [blame] | 112 | void CopyFrom(const float* const* data, const StreamConfig& stream_config); |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 113 | |
| 114 | // Copies data from the buffer. |
| 115 | void CopyTo(AudioFrame* frame) const; |
Michael Graczyk | 86c6d33 | 2015-07-23 11:41:39 -0700 | [diff] [blame] | 116 | void CopyTo(const StreamConfig& stream_config, float* const* data); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 117 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 118 | // Splits the buffer data into frequency bands. |
aluebs@webrtc.org | be05c74 | 2014-11-14 22:18:10 +0000 | [diff] [blame] | 119 | void SplitIntoFrequencyBands(); |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 120 | |
| 121 | // Recombines the frequency bands into a full-band signal. |
aluebs@webrtc.org | be05c74 | 2014-11-14 22:18:10 +0000 | [diff] [blame] | 122 | void MergeFrequencyBands(); |
| 123 | |
Per Åhgren | 928146f | 2019-08-20 09:19:21 +0200 | [diff] [blame] | 124 | // Copies the split bands data into the integer two-dimensional array. |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 125 | void ExportSplitChannelData(size_t channel, int16_t* const* split_band_data); |
Per Åhgren | 928146f | 2019-08-20 09:19:21 +0200 | [diff] [blame] | 126 | |
| 127 | // Copies the data in the integer two-dimensional array into the split_bands |
| 128 | // data. |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 129 | void ImportSplitChannelData(size_t channel, |
| 130 | const int16_t* const* split_band_data); |
Per Åhgren | 928146f | 2019-08-20 09:19:21 +0200 | [diff] [blame] | 131 | |
| 132 | static const size_t kMaxSplitFrameLength = 160; |
| 133 | static const size_t kMaxNumBands = 3; |
| 134 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 135 | // Deprecated methods, will be removed soon. |
| 136 | float* const* channels_f() { return channels(); } |
| 137 | const float* const* channels_const_f() const { return channels_const(); } |
| 138 | const float* const* split_bands_const_f(size_t channel) const { |
| 139 | return split_bands_const(channel); |
| 140 | } |
| 141 | float* const* split_bands_f(size_t channel) { return split_bands(channel); } |
| 142 | const float* const* split_channels_const_f(Band band) const { |
| 143 | return split_channels_const(band); |
| 144 | } |
| 145 | void DeinterleaveFrom(const AudioFrame* frame) { CopyFrom(frame); } |
| 146 | void InterleaveTo(AudioFrame* frame) const { CopyTo(frame); } |
| 147 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 148 | private: |
Alejandro Luebs | a181c9a | 2016-06-30 15:33:37 -0700 | [diff] [blame] | 149 | FRIEND_TEST_ALL_PREFIXES(AudioBufferTest, |
| 150 | SetNumChannelsSetsChannelBuffersNumChannels); |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 151 | void RestoreNumChannels(); |
andrew@webrtc.org | 17e4064 | 2014-03-04 20:58:13 +0000 | [diff] [blame] | 152 | |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 153 | const size_t input_num_frames_; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 154 | const size_t input_num_channels_; |
| 155 | const size_t buffer_num_frames_; |
| 156 | const size_t buffer_num_channels_; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 157 | const size_t output_num_frames_; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 158 | const size_t output_num_channels_; |
Steve Anton | f254e9e | 2019-08-21 17:52:28 +0000 | [diff] [blame] | 159 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 160 | size_t num_channels_; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 161 | size_t num_bands_; |
| 162 | size_t num_split_frames_; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 163 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 164 | std::unique_ptr<ChannelBuffer<float>> data_; |
| 165 | std::unique_ptr<ChannelBuffer<float>> split_data_; |
kwiberg | 88788ad | 2016-02-19 07:04:49 -0800 | [diff] [blame] | 166 | std::unique_ptr<SplittingFilter> splitting_filter_; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 167 | std::unique_ptr<ChannelBuffer<float>> output_buffer_; |
kwiberg | 4a206a9 | 2016-03-31 10:24:26 -0700 | [diff] [blame] | 168 | std::vector<std::unique_ptr<PushSincResampler>> input_resamplers_; |
| 169 | std::vector<std::unique_ptr<PushSincResampler>> output_resamplers_; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 170 | bool downmix_by_averaging_ = true; |
| 171 | size_t channel_for_downmixing_ = 0; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 172 | }; |
andrew@webrtc.org | ddbb8a2 | 2014-04-22 21:00:04 +0000 | [diff] [blame] | 173 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 174 | } // namespace webrtc |
| 175 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 176 | #endif // MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_ |