blob: ade3eec13db2a17377d4cebf074ba772ccfac55a [file] [log] [blame]
niklase@google.com470e71d2011-07-07 08:21:25 +00001/*
2 * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_
12#define MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_
niklase@google.com470e71d2011-07-07 08:21:25 +000013
kwiberg88788ad2016-02-19 07:04:49 -080014#include <memory>
kwiberg4a206a92016-03-31 10:24:26 -070015#include <vector>
kwiberg88788ad2016-02-19 07:04:49 -080016
Fredrik Solenbergbbf21a32018-04-12 22:44:09 +020017#include "api/audio/audio_frame.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020018#include "common_audio/channel_buffer.h"
19#include "modules/audio_processing/include/audio_processing.h"
20#include "modules/audio_processing/splitting_filter.h"
niklase@google.com470e71d2011-07-07 08:21:25 +000021
niklase@google.com470e71d2011-07-07 08:21:25 +000022namespace webrtc {
23
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +000024class PushSincResampler;
mflodman@webrtc.orgd5da2502014-05-15 11:17:21 +000025class IFChannelBuffer;
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +000026
Yves Gerey665174f2018-06-19 15:03:05 +020027enum Band { kBand0To8kHz = 0, kBand8To16kHz = 1, kBand16To24kHz = 2 };
aluebs@webrtc.orga7384a12014-12-03 01:06:35 +000028
niklase@google.com470e71d2011-07-07 08:21:25 +000029class AudioBuffer {
30 public:
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +000031 // TODO(ajm): Switch to take ChannelLayouts.
Peter Kastingdce40cf2015-08-24 14:52:23 -070032 AudioBuffer(size_t input_num_frames,
Peter Kasting69558702016-01-12 16:26:35 -080033 size_t num_input_channels,
Peter Kastingdce40cf2015-08-24 14:52:23 -070034 size_t process_num_frames,
Peter Kasting69558702016-01-12 16:26:35 -080035 size_t num_process_channels,
Peter Kastingdce40cf2015-08-24 14:52:23 -070036 size_t output_num_frames);
niklase@google.com470e71d2011-07-07 08:21:25 +000037 virtual ~AudioBuffer();
38
Peter Kasting69558702016-01-12 16:26:35 -080039 size_t num_channels() const;
40 void set_num_channels(size_t num_channels);
Peter Kastingdce40cf2015-08-24 14:52:23 -070041 size_t num_frames() const;
42 size_t num_frames_per_band() const;
43 size_t num_keyboard_frames() const;
44 size_t num_bands() const;
niklase@google.com470e71d2011-07-07 08:21:25 +000045
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000046 // Returns a pointer array to the full-band channels.
47 // Usage:
48 // channels()[channel][sample].
49 // Where:
50 // 0 <= channel < |num_proc_channels_|
51 // 0 <= sample < |proc_num_frames_|
aluebs@webrtc.orgbe05c742014-11-14 22:18:10 +000052 int16_t* const* channels();
aluebs@webrtc.orga7384a12014-12-03 01:06:35 +000053 const int16_t* const* channels_const() const;
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000054 float* const* channels_f();
55 const float* const* channels_const_f() const;
56
57 // Returns a pointer array to the bands for a specific channel.
58 // Usage:
59 // split_bands(channel)[band][sample].
60 // Where:
61 // 0 <= channel < |num_proc_channels_|
62 // 0 <= band < |num_bands_|
63 // 0 <= sample < |num_split_frames_|
Peter Kasting69558702016-01-12 16:26:35 -080064 int16_t* const* split_bands(size_t channel);
65 const int16_t* const* split_bands_const(size_t channel) const;
66 float* const* split_bands_f(size_t channel);
67 const float* const* split_bands_const_f(size_t channel) const;
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000068
69 // Returns a pointer array to the channels for a specific band.
70 // Usage:
71 // split_channels(band)[channel][sample].
72 // Where:
73 // 0 <= band < |num_bands_|
74 // 0 <= channel < |num_proc_channels_|
75 // 0 <= sample < |num_split_frames_|
aluebs@webrtc.orga7384a12014-12-03 01:06:35 +000076 int16_t* const* split_channels(Band band);
77 const int16_t* const* split_channels_const(Band band) const;
aluebs@webrtc.org3aca0b02015-02-26 21:52:20 +000078 float* const* split_channels_f(Band band);
79 const float* const* split_channels_const_f(Band band) const;
80
81 // Returns a pointer to the ChannelBuffer that encapsulates the full-band
82 // data.
83 ChannelBuffer<int16_t>* data();
84 const ChannelBuffer<int16_t>* data() const;
85 ChannelBuffer<float>* data_f();
86 const ChannelBuffer<float>* data_f() const;
87
88 // Returns a pointer to the ChannelBuffer that encapsulates the split data.
89 ChannelBuffer<int16_t>* split_data();
90 const ChannelBuffer<int16_t>* split_data() const;
91 ChannelBuffer<float>* split_data_f();
92 const ChannelBuffer<float>* split_data_f() const;
aluebs@webrtc.orga7384a12014-12-03 01:06:35 +000093
aluebs@webrtc.org2561d522014-07-17 08:27:39 +000094 // Returns a pointer to the low-pass data downmixed to mono. If this data
95 // isn't already available it re-calculates it.
96 const int16_t* mixed_low_pass_data();
andrew@webrtc.org65f93382014-04-30 16:44:13 +000097 const int16_t* low_pass_reference(int channel) const;
mflodman@webrtc.orgd5da2502014-05-15 11:17:21 +000098
andrew@webrtc.org103657b2014-04-24 18:28:56 +000099 const float* keyboard_data() const;
niklase@google.com470e71d2011-07-07 08:21:25 +0000100
andrew@webrtc.orged083d42011-09-19 15:28:51 +0000101 void set_activity(AudioFrame::VADActivity activity);
andrew@webrtc.org755b04a2011-11-15 16:57:56 +0000102 AudioFrame::VADActivity activity() const;
103
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000104 // Use for int16 interleaved data.
niklase@google.com470e71d2011-07-07 08:21:25 +0000105 void DeinterleaveFrom(AudioFrame* audioFrame);
andrew@webrtc.org755b04a2011-11-15 16:57:56 +0000106 // If |data_changed| is false, only the non-audio data members will be copied
107 // to |frame|.
kthelgasonc7daea82017-03-14 03:10:07 -0700108 void InterleaveTo(AudioFrame* frame, bool data_changed) const;
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000109
110 // Use for float deinterleaved data.
Michael Graczyk86c6d332015-07-23 11:41:39 -0700111 void CopyFrom(const float* const* data, const StreamConfig& stream_config);
112 void CopyTo(const StreamConfig& stream_config, float* const* data);
niklase@google.com470e71d2011-07-07 08:21:25 +0000113 void CopyLowPassToReference();
114
aluebs@webrtc.orgbe05c742014-11-14 22:18:10 +0000115 // Splits the signal into different bands.
116 void SplitIntoFrequencyBands();
117 // Recombine the different bands into one signal.
118 void MergeFrequencyBands();
119
niklase@google.com470e71d2011-07-07 08:21:25 +0000120 private:
Alejandro Luebsa181c9a2016-06-30 15:33:37 -0700121 FRIEND_TEST_ALL_PREFIXES(AudioBufferTest,
122 SetNumChannelsSetsChannelBuffersNumChannels);
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000123 // Called from DeinterleaveFrom() and CopyFrom().
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000124 void InitForNewData();
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000125
aluebs@webrtc.org27d106b2014-12-11 17:09:21 +0000126 // The audio is passed into DeinterleaveFrom() or CopyFrom() with input
127 // format (samples per channel and number of channels).
Peter Kastingdce40cf2015-08-24 14:52:23 -0700128 const size_t input_num_frames_;
Peter Kasting69558702016-01-12 16:26:35 -0800129 const size_t num_input_channels_;
aluebs@webrtc.org27d106b2014-12-11 17:09:21 +0000130 // The audio is stored by DeinterleaveFrom() or CopyFrom() with processing
131 // format.
Peter Kastingdce40cf2015-08-24 14:52:23 -0700132 const size_t proc_num_frames_;
Peter Kasting69558702016-01-12 16:26:35 -0800133 const size_t num_proc_channels_;
aluebs@webrtc.org27d106b2014-12-11 17:09:21 +0000134 // The audio is returned by InterleaveTo() and CopyTo() with output samples
135 // per channels and the current number of channels. This last one can be
136 // changed at any time using set_num_channels().
Peter Kastingdce40cf2015-08-24 14:52:23 -0700137 const size_t output_num_frames_;
Peter Kasting69558702016-01-12 16:26:35 -0800138 size_t num_channels_;
aluebs@webrtc.org27d106b2014-12-11 17:09:21 +0000139
Peter Kastingdce40cf2015-08-24 14:52:23 -0700140 size_t num_bands_;
141 size_t num_split_frames_;
aluebs@webrtc.org2561d522014-07-17 08:27:39 +0000142 bool mixed_low_pass_valid_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000143 bool reference_copied_;
andrew@webrtc.orged083d42011-09-19 15:28:51 +0000144 AudioFrame::VADActivity activity_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000145
andrew@webrtc.org103657b2014-04-24 18:28:56 +0000146 const float* keyboard_data_;
kwiberg88788ad2016-02-19 07:04:49 -0800147 std::unique_ptr<IFChannelBuffer> data_;
148 std::unique_ptr<IFChannelBuffer> split_data_;
149 std::unique_ptr<SplittingFilter> splitting_filter_;
Yves Gerey665174f2018-06-19 15:03:05 +0200150 std::unique_ptr<ChannelBuffer<int16_t>> mixed_low_pass_channels_;
151 std::unique_ptr<ChannelBuffer<int16_t>> low_pass_reference_channels_;
kwiberg88788ad2016-02-19 07:04:49 -0800152 std::unique_ptr<IFChannelBuffer> input_buffer_;
153 std::unique_ptr<IFChannelBuffer> output_buffer_;
Yves Gerey665174f2018-06-19 15:03:05 +0200154 std::unique_ptr<ChannelBuffer<float>> process_buffer_;
kwiberg4a206a92016-03-31 10:24:26 -0700155 std::vector<std::unique_ptr<PushSincResampler>> input_resamplers_;
156 std::vector<std::unique_ptr<PushSincResampler>> output_resamplers_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000157};
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000158
niklase@google.com470e71d2011-07-07 08:21:25 +0000159} // namespace webrtc
160
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200161#endif // MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_