niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #ifndef MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_ |
| 12 | #define MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_ |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 13 | |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 14 | #include <stddef.h> |
| 15 | #include <stdint.h> |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 16 | |
kwiberg | 88788ad | 2016-02-19 07:04:49 -0800 | [diff] [blame] | 17 | #include <memory> |
kwiberg | 4a206a9 | 2016-03-31 10:24:26 -0700 | [diff] [blame] | 18 | #include <vector> |
kwiberg | 88788ad | 2016-02-19 07:04:49 -0800 | [diff] [blame] | 19 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 20 | #include "common_audio/channel_buffer.h" |
| 21 | #include "modules/audio_processing/include/audio_processing.h" |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 22 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 23 | namespace webrtc { |
| 24 | |
// Forward declarations. AudioBuffer only holds these types through
// std::unique_ptr members, so their full definitions are not required in this
// header.
class PushSincResampler;
class SplittingFilter;
andrew@webrtc.org | ddbb8a2 | 2014-04-22 21:00:04 +0000 | [diff] [blame] | 27 | |
// Identifies one frequency band of a band-split signal. The enumerator values
// are fixed explicitly (0, 1, 2); the names indicate the nominal frequency
// range each band covers.
enum Band {
  kBand0To8kHz = 0,
  kBand8To16kHz = 1,
  kBand16To24kHz = 2
};
aluebs@webrtc.org | a7384a1 | 2014-12-03 01:06:35 +0000 | [diff] [blame] | 29 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 30 | // Stores any audio data in a way that allows the audio processing module to |
| 31 | // operate on it in a controlled manner. |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 32 | class AudioBuffer { |
| 33 | public: |
Per Åhgren | 0aefbf0 | 2019-08-23 21:29:17 +0200 | [diff] [blame] | 34 | static const int kSplitBandSize = 160; |
Sam Zackrisson | 5dd5482 | 2022-11-17 11:26:58 +0100 | [diff] [blame^] | 35 | static const int kMaxSampleRate = 384000; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 36 | AudioBuffer(size_t input_rate, |
| 37 | size_t input_num_channels, |
| 38 | size_t buffer_rate, |
| 39 | size_t buffer_num_channels, |
| 40 | size_t output_rate, |
| 41 | size_t output_num_channels); |
| 42 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 43 | virtual ~AudioBuffer(); |
| 44 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 45 | AudioBuffer(const AudioBuffer&) = delete; |
| 46 | AudioBuffer& operator=(const AudioBuffer&) = delete; |
Per Åhgren | 81c0cf2 | 2019-08-21 15:02:37 +0200 | [diff] [blame] | 47 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 48 | // Specify that downmixing should be done by selecting a single channel. |
| 49 | void set_downmixing_to_specific_channel(size_t channel); |
| 50 | |
| 51 | // Specify that downmixing should be done by averaging all channels,. |
| 52 | void set_downmixing_by_averaging(); |
| 53 | |
| 54 | // Set the number of channels in the buffer. The specified number of channels |
| 55 | // cannot be larger than the specified buffer_num_channels. The number is also |
| 56 | // reset at each call to CopyFrom or InterleaveFrom. |
| 57 | void set_num_channels(size_t num_channels); |
| 58 | |
| 59 | size_t num_channels() const { return num_channels_; } |
| 60 | size_t num_frames() const { return buffer_num_frames_; } |
| 61 | size_t num_frames_per_band() const { return num_split_frames_; } |
| 62 | size_t num_bands() const { return num_bands_; } |
| 63 | |
| 64 | // Returns pointer arrays to the full-band channels. |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 65 | // Usage: |
| 66 | // channels()[channel][sample]. |
| 67 | // Where: |
Artem Titov | 0b48930 | 2021-07-28 20:50:03 +0200 | [diff] [blame] | 68 | // 0 <= channel < `buffer_num_channels_` |
| 69 | // 0 <= sample < `buffer_num_frames_` |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 70 | float* const* channels() { return data_->channels(); } |
| 71 | const float* const* channels_const() const { return data_->channels(); } |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 72 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 73 | // Returns pointer arrays to the bands for a specific channel. |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 74 | // Usage: |
| 75 | // split_bands(channel)[band][sample]. |
| 76 | // Where: |
Artem Titov | 0b48930 | 2021-07-28 20:50:03 +0200 | [diff] [blame] | 77 | // 0 <= channel < `buffer_num_channels_` |
| 78 | // 0 <= band < `num_bands_` |
| 79 | // 0 <= sample < `num_split_frames_` |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 80 | const float* const* split_bands_const(size_t channel) const { |
| 81 | return split_data_.get() ? split_data_->bands(channel) |
| 82 | : data_->bands(channel); |
| 83 | } |
| 84 | float* const* split_bands(size_t channel) { |
| 85 | return split_data_.get() ? split_data_->bands(channel) |
| 86 | : data_->bands(channel); |
| 87 | } |
aluebs@webrtc.org | 3aca0b0 | 2015-02-26 21:52:20 +0000 | [diff] [blame] | 88 | |
| 89 | // Returns a pointer array to the channels for a specific band. |
| 90 | // Usage: |
| 91 | // split_channels(band)[channel][sample]. |
| 92 | // Where: |
Artem Titov | 0b48930 | 2021-07-28 20:50:03 +0200 | [diff] [blame] | 93 | // 0 <= band < `num_bands_` |
| 94 | // 0 <= channel < `buffer_num_channels_` |
| 95 | // 0 <= sample < `num_split_frames_` |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 96 | const float* const* split_channels_const(Band band) const { |
| 97 | if (split_data_.get()) { |
| 98 | return split_data_->channels(band); |
| 99 | } else { |
| 100 | return band == kBand0To8kHz ? data_->channels() : nullptr; |
| 101 | } |
| 102 | } |
andrew@webrtc.org | 755b04a | 2011-11-15 16:57:56 +0000 | [diff] [blame] | 103 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 104 | // Copies data into the buffer. |
Per Åhgren | 645f24c | 2020-03-16 12:06:02 +0100 | [diff] [blame] | 105 | void CopyFrom(const int16_t* const interleaved_data, |
| 106 | const StreamConfig& stream_config); |
| 107 | void CopyFrom(const float* const* stacked_data, |
| 108 | const StreamConfig& stream_config); |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 109 | |
| 110 | // Copies data from the buffer. |
Per Åhgren | 645f24c | 2020-03-16 12:06:02 +0100 | [diff] [blame] | 111 | void CopyTo(const StreamConfig& stream_config, |
| 112 | int16_t* const interleaved_data); |
| 113 | void CopyTo(const StreamConfig& stream_config, float* const* stacked_data); |
Gustaf Ullberg | 422b9e0 | 2019-10-09 13:02:14 +0200 | [diff] [blame] | 114 | void CopyTo(AudioBuffer* buffer) const; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 115 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 116 | // Splits the buffer data into frequency bands. |
aluebs@webrtc.org | be05c74 | 2014-11-14 22:18:10 +0000 | [diff] [blame] | 117 | void SplitIntoFrequencyBands(); |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 118 | |
| 119 | // Recombines the frequency bands into a full-band signal. |
aluebs@webrtc.org | be05c74 | 2014-11-14 22:18:10 +0000 | [diff] [blame] | 120 | void MergeFrequencyBands(); |
| 121 | |
Per Åhgren | 928146f | 2019-08-20 09:19:21 +0200 | [diff] [blame] | 122 | // Copies the split bands data into the integer two-dimensional array. |
Per Åhgren | e35b32c | 2019-11-22 18:22:04 +0100 | [diff] [blame] | 123 | void ExportSplitChannelData(size_t channel, |
| 124 | int16_t* const* split_band_data) const; |
Per Åhgren | 928146f | 2019-08-20 09:19:21 +0200 | [diff] [blame] | 125 | |
| 126 | // Copies the data in the integer two-dimensional array into the split_bands |
| 127 | // data. |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 128 | void ImportSplitChannelData(size_t channel, |
| 129 | const int16_t* const* split_band_data); |
Per Åhgren | 928146f | 2019-08-20 09:19:21 +0200 | [diff] [blame] | 130 | |
| 131 | static const size_t kMaxSplitFrameLength = 160; |
| 132 | static const size_t kMaxNumBands = 3; |
| 133 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 134 | // Deprecated methods, will be removed soon. |
| 135 | float* const* channels_f() { return channels(); } |
| 136 | const float* const* channels_const_f() const { return channels_const(); } |
| 137 | const float* const* split_bands_const_f(size_t channel) const { |
| 138 | return split_bands_const(channel); |
| 139 | } |
| 140 | float* const* split_bands_f(size_t channel) { return split_bands(channel); } |
| 141 | const float* const* split_channels_const_f(Band band) const { |
| 142 | return split_channels_const(band); |
| 143 | } |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 144 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 145 | private: |
Alejandro Luebs | a181c9a | 2016-06-30 15:33:37 -0700 | [diff] [blame] | 146 | FRIEND_TEST_ALL_PREFIXES(AudioBufferTest, |
| 147 | SetNumChannelsSetsChannelBuffersNumChannels); |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 148 | void RestoreNumChannels(); |
andrew@webrtc.org | 17e4064 | 2014-03-04 20:58:13 +0000 | [diff] [blame] | 149 | |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 150 | const size_t input_num_frames_; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 151 | const size_t input_num_channels_; |
| 152 | const size_t buffer_num_frames_; |
| 153 | const size_t buffer_num_channels_; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 154 | const size_t output_num_frames_; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 155 | const size_t output_num_channels_; |
Steve Anton | f254e9e | 2019-08-21 17:52:28 +0000 | [diff] [blame] | 156 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 157 | size_t num_channels_; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 158 | size_t num_bands_; |
| 159 | size_t num_split_frames_; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 160 | |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 161 | std::unique_ptr<ChannelBuffer<float>> data_; |
| 162 | std::unique_ptr<ChannelBuffer<float>> split_data_; |
kwiberg | 88788ad | 2016-02-19 07:04:49 -0800 | [diff] [blame] | 163 | std::unique_ptr<SplittingFilter> splitting_filter_; |
kwiberg | 4a206a9 | 2016-03-31 10:24:26 -0700 | [diff] [blame] | 164 | std::vector<std::unique_ptr<PushSincResampler>> input_resamplers_; |
| 165 | std::vector<std::unique_ptr<PushSincResampler>> output_resamplers_; |
Per Åhgren | d47941e | 2019-08-22 11:51:13 +0200 | [diff] [blame] | 166 | bool downmix_by_averaging_ = true; |
| 167 | size_t channel_for_downmixing_ = 0; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 168 | }; |
andrew@webrtc.org | ddbb8a2 | 2014-04-22 21:00:04 +0000 | [diff] [blame] | 169 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 170 | } // namespace webrtc |
| 171 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 172 | #endif // MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_ |