blob: 765cde7fe1d8b9954dec602b2e16e8defdeed613 [file] [log] [blame]
niklase@google.com470e71d2011-07-07 08:21:25 +00001/*
andrew@webrtc.org6f9f8172012-03-06 19:03:39 +00002 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
niklase@google.com470e71d2011-07-07 08:21:25 +00003 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
pbos@webrtc.org788acd12014-12-15 09:41:24 +000011#ifndef WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_
12#define WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_
niklase@google.com470e71d2011-07-07 08:21:25 +000013
14#include <list>
ajm@google.com808e0e02011-08-03 21:08:51 +000015#include <string>
niklase@google.com470e71d2011-07-07 08:21:25 +000016
kwiberg@webrtc.org00b8f6b2015-02-26 14:34:55 +000017#include "webrtc/base/scoped_ptr.h"
pbos@webrtc.org788acd12014-12-15 09:41:24 +000018#include "webrtc/base/thread_annotations.h"
Michael Graczykdfa36052015-03-25 16:37:27 -070019#include "webrtc/modules/audio_processing/include/audio_processing.h"
niklase@google.com470e71d2011-07-07 08:21:25 +000020
21namespace webrtc {
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +000022
pbos@webrtc.org788acd12014-12-15 09:41:24 +000023class AgcManagerDirect;
niklase@google.com470e71d2011-07-07 08:21:25 +000024class AudioBuffer;
Michael Graczykdfa36052015-03-25 16:37:27 -070025
26template<typename T>
27class Beamformer;
28
ajm@google.com808e0e02011-08-03 21:08:51 +000029class CriticalSectionWrapper;
andrew@webrtc.org56e4a052014-02-27 22:23:17 +000030class EchoCancellationImpl;
niklase@google.com470e71d2011-07-07 08:21:25 +000031class EchoControlMobileImpl;
ajm@google.com808e0e02011-08-03 21:08:51 +000032class FileWrapper;
niklase@google.com470e71d2011-07-07 08:21:25 +000033class GainControlImpl;
pbos@webrtc.org788acd12014-12-15 09:41:24 +000034class GainControlForNewAgc;
niklase@google.com470e71d2011-07-07 08:21:25 +000035class HighPassFilterImpl;
36class LevelEstimatorImpl;
37class NoiseSuppressionImpl;
38class ProcessingComponent;
pbos@webrtc.org788acd12014-12-15 09:41:24 +000039class TransientSuppressor;
niklase@google.com470e71d2011-07-07 08:21:25 +000040class VoiceDetectionImpl;
41
andrew@webrtc.org7bf26462011-12-03 00:03:31 +000042#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
43namespace audioproc {
44
45class Event;
46
47} // namespace audioproc
48#endif
49
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +000050class AudioRate {
51 public:
52 explicit AudioRate(int sample_rate_hz)
53 : rate_(sample_rate_hz),
54 samples_per_channel_(AudioProcessing::kChunkSizeMs * rate_ / 1000) {}
55 virtual ~AudioRate() {}
56
57 void set(int rate) {
58 rate_ = rate;
59 samples_per_channel_ = AudioProcessing::kChunkSizeMs * rate_ / 1000;
60 }
61
62 int rate() const { return rate_; }
63 int samples_per_channel() const { return samples_per_channel_; }
64
65 private:
66 int rate_;
67 int samples_per_channel_;
68};
69
70class AudioFormat : public AudioRate {
71 public:
72 AudioFormat(int sample_rate_hz, int num_channels)
73 : AudioRate(sample_rate_hz),
74 num_channels_(num_channels) {}
75 virtual ~AudioFormat() {}
76
77 void set(int rate, int num_channels) {
78 AudioRate::set(rate);
79 num_channels_ = num_channels;
80 }
81
82 int num_channels() const { return num_channels_; }
83
84 private:
85 int num_channels_;
86};
87
niklase@google.com470e71d2011-07-07 08:21:25 +000088class AudioProcessingImpl : public AudioProcessing {
89 public:
andrew@webrtc.orge84978f2014-01-25 02:09:06 +000090 explicit AudioProcessingImpl(const Config& config);
Michael Graczykdfa36052015-03-25 16:37:27 -070091
92 // AudioProcessingImpl takes ownership of beamformer.
93 AudioProcessingImpl(const Config& config, Beamformer<float>* beamformer);
niklase@google.com470e71d2011-07-07 08:21:25 +000094 virtual ~AudioProcessingImpl();
95
niklase@google.com470e71d2011-07-07 08:21:25 +000096 // AudioProcessing methods.
kjellander@webrtc.org14665ff2015-03-04 12:58:35 +000097 int Initialize() override;
98 int Initialize(int input_sample_rate_hz,
99 int output_sample_rate_hz,
100 int reverse_sample_rate_hz,
101 ChannelLayout input_layout,
102 ChannelLayout output_layout,
103 ChannelLayout reverse_layout) override;
104 void SetExtraOptions(const Config& config) override;
105 int set_sample_rate_hz(int rate) override;
106 int input_sample_rate_hz() const override;
107 int sample_rate_hz() const override;
108 int proc_sample_rate_hz() const override;
109 int proc_split_sample_rate_hz() const override;
110 int num_input_channels() const override;
111 int num_output_channels() const override;
112 int num_reverse_channels() const override;
113 void set_output_will_be_muted(bool muted) override;
114 bool output_will_be_muted() const override;
115 int ProcessStream(AudioFrame* frame) override;
116 int ProcessStream(const float* const* src,
117 int samples_per_channel,
118 int input_sample_rate_hz,
119 ChannelLayout input_layout,
120 int output_sample_rate_hz,
121 ChannelLayout output_layout,
122 float* const* dest) override;
123 int AnalyzeReverseStream(AudioFrame* frame) override;
124 int AnalyzeReverseStream(const float* const* data,
125 int samples_per_channel,
126 int sample_rate_hz,
127 ChannelLayout layout) override;
128 int set_stream_delay_ms(int delay) override;
129 int stream_delay_ms() const override;
130 bool was_stream_delay_set() const override;
131 void set_delay_offset_ms(int offset) override;
132 int delay_offset_ms() const override;
133 void set_stream_key_pressed(bool key_pressed) override;
134 bool stream_key_pressed() const override;
135 int StartDebugRecording(const char filename[kMaxFilenameSize]) override;
136 int StartDebugRecording(FILE* handle) override;
137 int StartDebugRecordingForPlatformFile(rtc::PlatformFile handle) override;
138 int StopDebugRecording() override;
139 EchoCancellation* echo_cancellation() const override;
140 EchoControlMobile* echo_control_mobile() const override;
141 GainControl* gain_control() const override;
142 HighPassFilter* high_pass_filter() const override;
143 LevelEstimator* level_estimator() const override;
144 NoiseSuppression* noise_suppression() const override;
145 VoiceDetection* voice_detection() const override;
niklase@google.com470e71d2011-07-07 08:21:25 +0000146
andrew@webrtc.org60730cf2014-01-07 17:45:09 +0000147 protected:
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000148 // Overridden in a mock.
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000149 virtual int InitializeLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_);
andrew@webrtc.org60730cf2014-01-07 17:45:09 +0000150
niklase@google.com470e71d2011-07-07 08:21:25 +0000151 private:
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000152 int InitializeLocked(int input_sample_rate_hz,
153 int output_sample_rate_hz,
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000154 int reverse_sample_rate_hz,
155 int num_input_channels,
156 int num_output_channels,
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000157 int num_reverse_channels)
158 EXCLUSIVE_LOCKS_REQUIRED(crit_);
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000159 int MaybeInitializeLocked(int input_sample_rate_hz,
160 int output_sample_rate_hz,
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000161 int reverse_sample_rate_hz,
162 int num_input_channels,
163 int num_output_channels,
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000164 int num_reverse_channels)
165 EXCLUSIVE_LOCKS_REQUIRED(crit_);
166 int ProcessStreamLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_);
167 int AnalyzeReverseStreamLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_);
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000168
andrew@webrtc.org369166a2012-04-24 18:38:03 +0000169 bool is_data_processed() const;
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000170 bool output_copy_needed(bool is_data_processed) const;
andrew@webrtc.org369166a2012-04-24 18:38:03 +0000171 bool synthesis_needed(bool is_data_processed) const;
172 bool analysis_needed(bool is_data_processed) const;
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000173 int InitializeExperimentalAgc() EXCLUSIVE_LOCKS_REQUIRED(crit_);
174 int InitializeTransient() EXCLUSIVE_LOCKS_REQUIRED(crit_);
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +0000175 void InitializeBeamformer() EXCLUSIVE_LOCKS_REQUIRED(crit_);
ajm@google.com808e0e02011-08-03 21:08:51 +0000176
andrew@webrtc.org56e4a052014-02-27 22:23:17 +0000177 EchoCancellationImpl* echo_cancellation_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000178 EchoControlMobileImpl* echo_control_mobile_;
179 GainControlImpl* gain_control_;
180 HighPassFilterImpl* high_pass_filter_;
181 LevelEstimatorImpl* level_estimator_;
182 NoiseSuppressionImpl* noise_suppression_;
183 VoiceDetectionImpl* voice_detection_;
kwiberg@webrtc.org00b8f6b2015-02-26 14:34:55 +0000184 rtc::scoped_ptr<GainControlForNewAgc> gain_control_for_new_agc_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000185
186 std::list<ProcessingComponent*> component_list_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000187 CriticalSectionWrapper* crit_;
kwiberg@webrtc.org00b8f6b2015-02-26 14:34:55 +0000188 rtc::scoped_ptr<AudioBuffer> render_audio_;
189 rtc::scoped_ptr<AudioBuffer> capture_audio_;
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000190#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
191 // TODO(andrew): make this more graceful. Ideally we would split this stuff
192 // out into a separate class with an "enabled" and "disabled" implementation.
193 int WriteMessageToDebugFile();
194 int WriteInitMessage();
kwiberg@webrtc.org00b8f6b2015-02-26 14:34:55 +0000195 rtc::scoped_ptr<FileWrapper> debug_file_;
196 rtc::scoped_ptr<audioproc::Event> event_msg_; // Protobuf message.
andrew@webrtc.org60730cf2014-01-07 17:45:09 +0000197 std::string event_str_; // Memory for protobuf serialization.
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000198#endif
niklase@google.com470e71d2011-07-07 08:21:25 +0000199
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000200 AudioFormat fwd_in_format_;
aluebs@webrtc.org27d106b2014-12-11 17:09:21 +0000201 // This one is an AudioRate, because the forward processing number of channels
202 // is mutable and is tracked by the capture_audio_.
203 AudioRate fwd_proc_format_;
204 AudioFormat fwd_out_format_;
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000205 AudioFormat rev_in_format_;
206 AudioFormat rev_proc_format_;
207 int split_rate_;
208
niklase@google.com470e71d2011-07-07 08:21:25 +0000209 int stream_delay_ms_;
andrew@webrtc.org6f9f8172012-03-06 19:03:39 +0000210 int delay_offset_ms_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000211 bool was_stream_delay_set_;
212
andrew@webrtc.org17342e52014-02-12 22:28:31 +0000213 bool output_will_be_muted_;
andrew@webrtc.org75dd2882014-02-11 20:52:30 +0000214
215 bool key_pressed_;
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000216
217 // Only set through the constructor's Config parameter.
218 const bool use_new_agc_;
kwiberg@webrtc.org00b8f6b2015-02-26 14:34:55 +0000219 rtc::scoped_ptr<AgcManagerDirect> agc_manager_ GUARDED_BY(crit_);
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000220
221 bool transient_suppressor_enabled_;
kwiberg@webrtc.org00b8f6b2015-02-26 14:34:55 +0000222 rtc::scoped_ptr<TransientSuppressor> transient_suppressor_;
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +0000223 const bool beamformer_enabled_;
Michael Graczykdfa36052015-03-25 16:37:27 -0700224 rtc::scoped_ptr<Beamformer<float>> beamformer_;
aluebs@webrtc.orgfb7a0392015-01-05 21:58:58 +0000225 const std::vector<Point> array_geometry_;
aluebs@webrtc.orgc9ce07e2015-03-02 20:07:31 +0000226
227 const bool supports_48kHz_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000228};
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000229
niklase@google.com470e71d2011-07-07 08:21:25 +0000230} // namespace webrtc
231
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000232#endif // WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_