blob: 3e1b4661221dabeab90717ec1b46bbd2643324f9 [file] [log] [blame]
niklase@google.com470e71d2011-07-07 08:21:25 +00001/*
andrew@webrtc.org6f9f8172012-03-06 19:03:39 +00002 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
niklase@google.com470e71d2011-07-07 08:21:25 +00003 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_
12#define MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_
niklase@google.com470e71d2011-07-07 08:21:25 +000013
14#include <list>
kwiberg88788ad2016-02-19 07:04:49 -080015#include <memory>
Michael Graczyk86c6d332015-07-23 11:41:39 -070016#include <vector>
niklase@google.com470e71d2011-07-07 08:21:25 +000017
Artem Titov741daaf2019-03-21 14:37:36 +010018#include "api/function_view.h"
saza1d600522019-10-18 13:29:43 +020019#include "modules/audio_processing/aec3/echo_canceller3.h"
20#include "modules/audio_processing/agc/agc_manager_direct.h"
Sam Zackrisson41478c72019-10-15 10:10:26 +020021#include "modules/audio_processing/agc/gain_control.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020022#include "modules/audio_processing/audio_buffer.h"
saza1d600522019-10-18 13:29:43 +020023#include "modules/audio_processing/echo_cancellation_impl.h"
24#include "modules/audio_processing/echo_control_mobile_impl.h"
25#include "modules/audio_processing/gain_control_for_experimental_agc.h"
26#include "modules/audio_processing/gain_control_impl.h"
27#include "modules/audio_processing/gain_controller2.h"
28#include "modules/audio_processing/high_pass_filter.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020029#include "modules/audio_processing/include/aec_dump.h"
30#include "modules/audio_processing/include/audio_processing.h"
Sam Zackrissonb24c00f2018-11-26 16:18:25 +010031#include "modules/audio_processing/include/audio_processing_statistics.h"
Per Åhgren87a7b822019-10-29 22:59:44 +010032#include "modules/audio_processing/legacy_noise_suppression.h"
saza1d600522019-10-18 13:29:43 +020033#include "modules/audio_processing/level_estimator.h"
Per Åhgren87a7b822019-10-29 22:59:44 +010034#include "modules/audio_processing/ns/noise_suppressor.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020035#include "modules/audio_processing/render_queue_item_verifier.h"
saza1d600522019-10-18 13:29:43 +020036#include "modules/audio_processing/residual_echo_detector.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020037#include "modules/audio_processing/rms_level.h"
saza1d600522019-10-18 13:29:43 +020038#include "modules/audio_processing/transient/transient_suppressor.h"
39#include "modules/audio_processing/voice_detection.h"
Steve Anton10542f22019-01-11 09:11:00 -080040#include "rtc_base/critical_section.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020041#include "rtc_base/gtest_prod_util.h"
42#include "rtc_base/ignore_wundef.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020043#include "rtc_base/swap_queue.h"
44#include "rtc_base/thread_annotations.h"
peahdf3efa82015-11-28 12:35:15 -080045
niklase@google.com470e71d2011-07-07 08:21:25 +000046namespace webrtc {
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +000047
Per Åhgren13735822018-02-12 21:42:56 +010048class ApmDataDumper;
ekmeyerson60d9b332015-08-14 10:35:55 -070049class AudioConverter;
Michael Graczykdfa36052015-03-25 16:37:27 -070050
niklase@google.com470e71d2011-07-07 08:21:25 +000051class AudioProcessingImpl : public AudioProcessing {
52 public:
peahdf3efa82015-11-28 12:35:15 -080053 // Methods forcing APM to run in a single-threaded manner.
54 // Acquires both the render and capture locks.
peah88ac8532016-09-12 16:47:25 -070055 explicit AudioProcessingImpl(const webrtc::Config& config);
Sam Zackrissondb389722018-06-21 10:12:24 +020056 // AudioProcessingImpl takes ownership of the std::unique_ptr arguments.
peah88ac8532016-09-12 16:47:25 -070057 AudioProcessingImpl(const webrtc::Config& config,
Alex Loiko5825aa62017-12-18 16:02:40 +010058 std::unique_ptr<CustomProcessing> capture_post_processor,
59 std::unique_ptr<CustomProcessing> render_pre_processor,
Gustaf Ullberg002ef282017-10-12 15:13:17 +020060 std::unique_ptr<EchoControlFactory> echo_control_factory,
Valeriia Nemychnikovaf06eb572018-08-29 10:37:09 +020061 rtc::scoped_refptr<EchoDetector> echo_detector,
62 std::unique_ptr<CustomAudioAnalyzer> capture_analyzer);
kwiberg83ffe452016-08-29 14:46:07 -070063 ~AudioProcessingImpl() override;
kjellander@webrtc.org14665ff2015-03-04 12:58:35 +000064 int Initialize() override;
peahde65ddc2016-09-16 15:02:15 -070065 int Initialize(int capture_input_sample_rate_hz,
66 int capture_output_sample_rate_hz,
67 int render_sample_rate_hz,
68 ChannelLayout capture_input_layout,
69 ChannelLayout capture_output_layout,
70 ChannelLayout render_input_layout) override;
Michael Graczyk86c6d332015-07-23 11:41:39 -070071 int Initialize(const ProcessingConfig& processing_config) override;
peah88ac8532016-09-12 16:47:25 -070072 void ApplyConfig(const AudioProcessing::Config& config) override;
73 void SetExtraOptions(const webrtc::Config& config) override;
peahdf3efa82015-11-28 12:35:15 -080074 void UpdateHistogramsOnCallEnd() override;
aleloi868f32f2017-05-23 07:20:05 -070075 void AttachAecDump(std::unique_ptr<AecDump> aec_dump) override;
76 void DetachAecDump() override;
Sam Zackrisson4d364492018-03-02 16:03:21 +010077 void AttachPlayoutAudioGenerator(
78 std::unique_ptr<AudioGenerator> audio_generator) override;
79 void DetachPlayoutAudioGenerator() override;
peahdf3efa82015-11-28 12:35:15 -080080
Alessio Bazzicac054e782018-04-16 12:10:09 +020081 void SetRuntimeSetting(RuntimeSetting setting) override;
82
peahdf3efa82015-11-28 12:35:15 -080083 // Capture-side exclusive methods possibly running APM in a
84 // multi-threaded manner. Acquire the capture lock.
kjellander@webrtc.org14665ff2015-03-04 12:58:35 +000085 int ProcessStream(AudioFrame* frame) override;
86 int ProcessStream(const float* const* src,
Michael Graczyk86c6d332015-07-23 11:41:39 -070087 const StreamConfig& input_config,
88 const StreamConfig& output_config,
89 float* const* dest) override;
peahdf3efa82015-11-28 12:35:15 -080090 void set_output_will_be_muted(bool muted) override;
91 int set_stream_delay_ms(int delay) override;
92 void set_delay_offset_ms(int offset) override;
93 int delay_offset_ms() const override;
94 void set_stream_key_pressed(bool key_pressed) override;
Sam Zackrissonf0d1c032019-03-27 13:28:08 +010095 void set_stream_analog_level(int level) override;
96 int recommended_stream_analog_level() const override;
peahdf3efa82015-11-28 12:35:15 -080097
98 // Render-side exclusive methods possibly running APM in a
99 // multi-threaded manner. Acquire the render lock.
ekmeyerson60d9b332015-08-14 10:35:55 -0700100 int ProcessReverseStream(AudioFrame* frame) override;
kjellander@webrtc.org14665ff2015-03-04 12:58:35 +0000101 int AnalyzeReverseStream(const float* const* data,
Gustaf Ullberg8c51f2e2019-10-22 15:21:31 +0200102 const StreamConfig& reverse_config) override;
ekmeyerson60d9b332015-08-14 10:35:55 -0700103 int ProcessReverseStream(const float* const* src,
peahde65ddc2016-09-16 15:02:15 -0700104 const StreamConfig& input_config,
105 const StreamConfig& output_config,
ekmeyerson60d9b332015-08-14 10:35:55 -0700106 float* const* dest) override;
peahdf3efa82015-11-28 12:35:15 -0800107
108 // Methods only accessed from APM submodules or
109 // from AudioProcessing tests in a single-threaded manner.
110 // Hence there is no need for locks in these.
111 int proc_sample_rate_hz() const override;
112 int proc_split_sample_rate_hz() const override;
Peter Kasting69558702016-01-12 16:26:35 -0800113 size_t num_input_channels() const override;
114 size_t num_proc_channels() const override;
115 size_t num_output_channels() const override;
116 size_t num_reverse_channels() const override;
kjellander@webrtc.org14665ff2015-03-04 12:58:35 +0000117 int stream_delay_ms() const override;
peahdf3efa82015-11-28 12:35:15 -0800118 bool was_stream_delay_set() const override
danilchap56359be2017-09-07 07:53:45 -0700119 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
peahdf3efa82015-11-28 12:35:15 -0800120
Ivo Creusenae026092017-11-20 13:07:16 +0100121 AudioProcessingStats GetStatistics(bool has_remote_tracks) const override;
ivoc3e9a5372016-10-28 07:55:33 -0700122
henrik.lundinadf06352017-04-05 05:48:24 -0700123 // TODO(peah): Remove MutateConfig once the new API allows that.
peah8271d042016-11-22 07:24:52 -0800124 void MutateConfig(rtc::FunctionView<void(AudioProcessing::Config*)> mutator);
henrik.lundinadf06352017-04-05 05:48:24 -0700125 AudioProcessing::Config GetConfig() const override;
peah8271d042016-11-22 07:24:52 -0800126
andrew@webrtc.org60730cf2014-01-07 17:45:09 +0000127 protected:
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000128 // Overridden in a mock.
peahdf3efa82015-11-28 12:35:15 -0800129 virtual int InitializeLocked()
danilchap56359be2017-09-07 07:53:45 -0700130 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_);
andrew@webrtc.org60730cf2014-01-07 17:45:09 +0000131
niklase@google.com470e71d2011-07-07 08:21:25 +0000132 private:
peahc19f3122016-10-07 14:54:10 -0700133 // TODO(peah): These friend classes should be removed as soon as the new
134 // parameter setting scheme allows.
135 FRIEND_TEST_ALL_PREFIXES(ApmConfiguration, DefaultBehavior);
136 FRIEND_TEST_ALL_PREFIXES(ApmConfiguration, ValidConfigBehavior);
137 FRIEND_TEST_ALL_PREFIXES(ApmConfiguration, InValidConfigBehavior);
Alessio Bazzicac054e782018-04-16 12:10:09 +0200138
139 // Class providing thread-safe message pipe functionality for
140 // |runtime_settings_|.
141 class RuntimeSettingEnqueuer {
142 public:
143 explicit RuntimeSettingEnqueuer(
144 SwapQueue<RuntimeSetting>* runtime_settings);
145 ~RuntimeSettingEnqueuer();
146 void Enqueue(RuntimeSetting setting);
147
148 private:
Alessio Bazzica33444dc2018-04-20 13:16:55 +0200149 SwapQueue<RuntimeSetting>& runtime_settings_;
Alex Loiko73ec0192018-05-15 10:52:28 +0200150 };
Alex Loiko73ec0192018-05-15 10:52:28 +0200151
152 std::unique_ptr<ApmDataDumper> data_dumper_;
153 static int instance_count_;
Per Åhgren87a7b822019-10-29 22:59:44 +0100154 const bool enforced_usage_of_legacy_ns_;
Alex Loiko73ec0192018-05-15 10:52:28 +0200155
156 SwapQueue<RuntimeSetting> capture_runtime_settings_;
157 SwapQueue<RuntimeSetting> render_runtime_settings_;
158
159 RuntimeSettingEnqueuer capture_runtime_settings_enqueuer_;
160 RuntimeSettingEnqueuer render_runtime_settings_enqueuer_;
Alessio Bazzicac054e782018-04-16 12:10:09 +0200161
Gustaf Ullberg002ef282017-10-12 15:13:17 +0200162 // EchoControl factory.
163 std::unique_ptr<EchoControlFactory> echo_control_factory_;
Gustaf Ullbergd8579e02017-10-11 16:29:02 +0200164
// Bookkeeping of which submodules are currently enabled. The three flags
// passed to the constructor are const for the lifetime of the object; all
// other flags are refreshed through Update().
class SubmoduleStates {
 public:
  SubmoduleStates(bool capture_post_processor_enabled,
                  bool render_pre_processor_enabled,
                  bool capture_analyzer_enabled);

  // Updates the submodule state and returns true if it has changed.
  bool Update(bool high_pass_filter_enabled,
              bool echo_canceller_enabled,
              bool mobile_echo_controller_enabled,
              bool residual_echo_detector_enabled,
              bool noise_suppressor_enabled,
              bool adaptive_gain_controller_enabled,
              bool gain_controller2_enabled,
              bool pre_amplifier_enabled,
              bool echo_controller_enabled,
              bool voice_detector_enabled,
              bool transient_suppressor_enabled);

  // Capture-side queries.
  bool CaptureMultiBandSubModulesActive() const;
  bool CaptureMultiBandProcessingPresent() const;
  bool CaptureMultiBandProcessingActive(bool ec_processing_active) const;
  bool CaptureFullBandProcessingActive() const;
  bool CaptureAnalyzerActive() const;

  // Render-side queries.
  bool RenderMultiBandSubModulesActive() const;
  bool RenderFullBandProcessingActive() const;
  bool RenderMultiBandProcessingActive() const;

  bool HighPassFilteringRequired() const;

 private:
  // Fixed at construction.
  const bool capture_post_processor_enabled_ = false;
  const bool render_pre_processor_enabled_ = false;
  const bool capture_analyzer_enabled_ = false;

  // Mirrors of the arguments most recently given to Update().
  bool high_pass_filter_enabled_ = false;
  bool echo_canceller_enabled_ = false;
  bool mobile_echo_controller_enabled_ = false;
  bool residual_echo_detector_enabled_ = false;
  bool noise_suppressor_enabled_ = false;
  bool adaptive_gain_controller_enabled_ = false;
  bool gain_controller2_enabled_ = false;
  bool pre_amplifier_enabled_ = false;
  bool echo_controller_enabled_ = false;
  bool voice_detector_enabled_ = false;
  bool transient_suppressor_enabled_ = false;

  // NOTE(review): presumably makes the first Update() call report a change
  // unconditionally -- confirm against the definition.
  bool first_update_ = true;
};
209
peahdf3efa82015-11-28 12:35:15 -0800210 // Method for modifying the formats struct that is called from both
211 // the render and capture threads. The check for whether modifications
212 // are needed is done while holding the render lock only, thereby avoiding
213 // that the capture thread blocks the render thread.
214 // The struct is modified in a single-threaded manner by holding both the
215 // render and capture locks.
peahdf3efa82015-11-28 12:35:15 -0800216 int MaybeInitializeRender(const ProcessingConfig& processing_config)
danilchap56359be2017-09-07 07:53:45 -0700217 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_);
peahdf3efa82015-11-28 12:35:15 -0800218
peah2ace3f92016-09-10 04:42:27 -0700219 // Method for updating the state keeping track of the active submodules.
220 // Returns a bool indicating whether the state has changed.
danilchap56359be2017-09-07 07:53:45 -0700221 bool UpdateActiveSubmoduleStates()
222 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
peahdf3efa82015-11-28 12:35:15 -0800223
224 // Methods requiring APM running in a single-threaded manner.
225 // Are called with both the render and capture locks already
226 // acquired.
peahdf3efa82015-11-28 12:35:15 -0800227 void InitializeTransient()
danilchap56359be2017-09-07 07:53:45 -0700228 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_);
Michael Graczyk86c6d332015-07-23 11:41:39 -0700229 int InitializeLocked(const ProcessingConfig& config)
danilchap56359be2017-09-07 07:53:45 -0700230 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_);
ivoc9f4a4a02016-10-28 05:39:16 -0700231 void InitializeResidualEchoDetector()
danilchap56359be2017-09-07 07:53:45 -0700232 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_);
Per Åhgren0aefbf02019-08-23 21:29:17 +0200233 void InitializeHighPassFilter() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
Sam Zackrisson0824c6f2019-10-07 14:03:56 +0200234 void InitializeVoiceDetector() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
Per Åhgrenf204faf2019-04-25 15:18:06 +0200235 void InitializeEchoController()
236 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_);
Sam Zackrisson0beac582017-09-25 12:04:02 +0200237 void InitializeGainController2() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
saza0bad15f2019-10-16 11:46:11 +0200238 void InitializeNoiseSuppressor() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
Alex Loikob5c9a792018-04-16 16:31:22 +0200239 void InitializePreAmplifier() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
Sam Zackrisson0beac582017-09-25 12:04:02 +0200240 void InitializePostProcessor() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
Valeriia Nemychnikovaf06eb572018-08-29 10:37:09 +0200241 void InitializeAnalyzer() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
Alex Loiko5825aa62017-12-18 16:02:40 +0100242 void InitializePreProcessor() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_);
peahdf3efa82015-11-28 12:35:15 -0800243
Gustaf Ullberg422b9e02019-10-09 13:02:14 +0200244 // Sample rate used for the fullband processing.
245 int proc_fullband_sample_rate_hz() const
246 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
247
Alex Loiko73ec0192018-05-15 10:52:28 +0200248 // Empties and handles the respective RuntimeSetting queues.
249 void HandleCaptureRuntimeSettings()
250 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
251 void HandleRenderRuntimeSettings() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_);
Sam Zackrissonf0d1c032019-03-27 13:28:08 +0100252 void ApplyAgc1Config(const Config::GainController1& agc_config)
253 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
254
255 // Returns a direct pointer to the AGC1 submodule: either a GainControlImpl
256 // or GainControlForExperimentalAgc instance.
257 GainControl* agc1();
258 const GainControl* agc1() const;
Alessio Bazzicac054e782018-04-16 12:10:09 +0200259
peah764e3642016-10-22 05:04:30 -0700260 void EmptyQueuedRenderAudio();
261 void AllocateRenderQueue()
danilchap56359be2017-09-07 07:53:45 -0700262 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_);
peah9e6a2902017-05-15 07:19:21 -0700263 void QueueBandedRenderAudio(AudioBuffer* audio)
danilchap56359be2017-09-07 07:53:45 -0700264 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_);
peah9e6a2902017-05-15 07:19:21 -0700265 void QueueNonbandedRenderAudio(AudioBuffer* audio)
danilchap56359be2017-09-07 07:53:45 -0700266 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_);
peah764e3642016-10-22 05:04:30 -0700267
peahdf3efa82015-11-28 12:35:15 -0800268 // Capture-side exclusive methods possibly running APM in a multi-threaded
269 // manner that are called with the capture lock already acquired.
danilchap56359be2017-09-07 07:53:45 -0700270 int ProcessCaptureStreamLocked() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
peahdf3efa82015-11-28 12:35:15 -0800271
272 // Render-side exclusive methods possibly running APM in a multi-threaded
273 // manner that are called with the render lock already acquired.
ekmeyerson60d9b332015-08-14 10:35:55 -0700274 // TODO(ekm): Remove once all clients updated to new interface.
peahdf3efa82015-11-28 12:35:15 -0800275 int AnalyzeReverseStreamLocked(const float* const* src,
276 const StreamConfig& input_config,
277 const StreamConfig& output_config)
danilchap56359be2017-09-07 07:53:45 -0700278 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_);
279 int ProcessRenderStreamLocked() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_render_);
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000280
aleloi868f32f2017-05-23 07:20:05 -0700281 // Collects configuration settings from public and private
282 // submodules to be saved as an audioproc::Config message on the
283 // AecDump if it is attached. If not |forced|, only writes the current
284 // config if it is different from the last saved one; if |forced|,
285 // writes the config regardless of the last saved.
286 void WriteAecDumpConfigMessage(bool forced)
danilchap56359be2017-09-07 07:53:45 -0700287 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
aleloi868f32f2017-05-23 07:20:05 -0700288
289 // Notifies attached AecDump of current configuration and capture data.
290 void RecordUnprocessedCaptureStream(const float* const* capture_stream)
danilchap56359be2017-09-07 07:53:45 -0700291 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
aleloi868f32f2017-05-23 07:20:05 -0700292
293 void RecordUnprocessedCaptureStream(const AudioFrame& capture_frame)
danilchap56359be2017-09-07 07:53:45 -0700294 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
aleloi868f32f2017-05-23 07:20:05 -0700295
296 // Notifies attached AecDump of current configuration and
297 // processed capture data and issues a capture stream recording
298 // request.
299 void RecordProcessedCaptureStream(
300 const float* const* processed_capture_stream)
danilchap56359be2017-09-07 07:53:45 -0700301 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
aleloi868f32f2017-05-23 07:20:05 -0700302
303 void RecordProcessedCaptureStream(const AudioFrame& processed_capture_frame)
danilchap56359be2017-09-07 07:53:45 -0700304 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
aleloi868f32f2017-05-23 07:20:05 -0700305
306 // Notifies attached AecDump about current state (delay, drift, etc).
danilchap56359be2017-09-07 07:53:45 -0700307 void RecordAudioProcessingState() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_capture_);
aleloi868f32f2017-05-23 07:20:05 -0700308
aleloi868f32f2017-05-23 07:20:05 -0700309 // AecDump instance used for optionally logging APM config, input
310 // and output to file in the AEC-dump format defined in debug.proto.
311 std::unique_ptr<AecDump> aec_dump_;
312
313 // Hold the last config written with AecDump for avoiding writing
314 // the same config twice.
danilchap56359be2017-09-07 07:53:45 -0700315 InternalAPMConfig apm_config_for_aec_dump_ RTC_GUARDED_BY(crit_capture_);
aleloi868f32f2017-05-23 07:20:05 -0700316
peahdf3efa82015-11-28 12:35:15 -0800317 // Critical sections.
danilchap56359be2017-09-07 07:53:45 -0700318 rtc::CriticalSection crit_render_ RTC_ACQUIRED_BEFORE(crit_capture_);
pbos5ad935c2016-01-25 03:52:44 -0800319 rtc::CriticalSection crit_capture_;
peahdf3efa82015-11-28 12:35:15 -0800320
peahc19f3122016-10-07 14:54:10 -0700321 // Struct containing the Config specifying the behavior of APM.
322 AudioProcessing::Config config_;
323
peah2ace3f92016-09-10 04:42:27 -0700324 // Class containing information about what submodules are active.
saza1d600522019-10-18 13:29:43 +0200325 SubmoduleStates submodule_states_;
peah2ace3f92016-09-10 04:42:27 -0700326
saza1d600522019-10-18 13:29:43 +0200327 // Struct containing the pointers to the submodules.
328 struct Submodules {
329 Submodules(std::unique_ptr<CustomProcessing> capture_post_processor,
330 std::unique_ptr<CustomProcessing> render_pre_processor,
331 rtc::scoped_refptr<EchoDetector> echo_detector,
332 std::unique_ptr<CustomAudioAnalyzer> capture_analyzer)
333 : echo_detector(std::move(echo_detector)),
334 capture_post_processor(std::move(capture_post_processor)),
335 render_pre_processor(std::move(render_pre_processor)),
336 capture_analyzer(std::move(capture_analyzer)) {}
337 // Accessed internally from capture or during initialization.
338 std::unique_ptr<AgcManagerDirect> agc_manager;
339 std::unique_ptr<GainControlImpl> gain_control;
340 std::unique_ptr<GainControlForExperimentalAgc>
341 gain_control_for_experimental_agc;
342 std::unique_ptr<GainController2> gain_controller2;
343 std::unique_ptr<HighPassFilter> high_pass_filter;
344 rtc::scoped_refptr<EchoDetector> echo_detector;
345 std::unique_ptr<EchoCancellationImpl> echo_cancellation;
346 std::unique_ptr<EchoControl> echo_controller;
347 std::unique_ptr<EchoControlMobileImpl> echo_control_mobile;
Per Åhgren87a7b822019-10-29 22:59:44 +0100348 std::unique_ptr<NoiseSuppression> legacy_noise_suppressor;
349 std::unique_ptr<NoiseSuppressor> noise_suppressor;
saza1d600522019-10-18 13:29:43 +0200350 std::unique_ptr<TransientSuppressor> transient_suppressor;
351 std::unique_ptr<CustomProcessing> capture_post_processor;
352 std::unique_ptr<CustomProcessing> render_pre_processor;
353 std::unique_ptr<GainApplier> pre_amplifier;
354 std::unique_ptr<CustomAudioAnalyzer> capture_analyzer;
355 std::unique_ptr<LevelEstimator> output_level_estimator;
356 std::unique_ptr<VoiceDetection> voice_detector;
357 } submodules_;
peahdf3efa82015-11-28 12:35:15 -0800358
peah192164e2015-11-17 02:16:45 -0800359 // State that is written to while holding both the render and capture locks
peahdf3efa82015-11-28 12:35:15 -0800360 // but can be read without any lock being held.
361 // As this is only accessed internally of APM, and all internal methods in APM
362 // either are holding the render or capture locks, this construct is safe as
363 // it is not possible to read the variables while writing them.
364 struct ApmFormatState {
365 ApmFormatState()
peah192164e2015-11-17 02:16:45 -0800366 : // Format of processing streams at input/output call sites.
peahdf3efa82015-11-28 12:35:15 -0800367 api_format({{{kSampleRate16kHz, 1, false},
368 {kSampleRate16kHz, 1, false},
369 {kSampleRate16kHz, 1, false},
370 {kSampleRate16kHz, 1, false}}}),
peahde65ddc2016-09-16 15:02:15 -0700371 render_processing_format(kSampleRate16kHz, 1) {}
peahdf3efa82015-11-28 12:35:15 -0800372 ProcessingConfig api_format;
peahde65ddc2016-09-16 15:02:15 -0700373 StreamConfig render_processing_format;
peahdf3efa82015-11-28 12:35:15 -0800374 } formats_;
Michael Graczyk86c6d332015-07-23 11:41:39 -0700375
peahdf3efa82015-11-28 12:35:15 -0800376 // APM constants.
377 const struct ApmConstants {
henrik.lundinbd681b92016-12-05 09:08:42 -0800378 ApmConstants(int agc_startup_min_volume,
379 int agc_clipped_level_min,
Alex Loiko64cb83b2018-07-02 13:38:19 +0200380 bool use_experimental_agc,
381 bool use_experimental_agc_agc2_level_estimation,
Alex Loikod9342442018-09-10 13:59:41 +0200382 bool use_experimental_agc_agc2_digital_adaptive,
Sam Zackrissonfeee1e42019-09-20 07:50:35 +0200383 bool use_experimental_agc_process_before_aec,
384 bool experimental_multi_channel_render_support,
385 bool experimental_multi_channel_capture_support)
386 : agc_startup_min_volume(agc_startup_min_volume),
henrik.lundinbd681b92016-12-05 09:08:42 -0800387 agc_clipped_level_min(agc_clipped_level_min),
Alex Loiko64cb83b2018-07-02 13:38:19 +0200388 use_experimental_agc(use_experimental_agc),
389 use_experimental_agc_agc2_level_estimation(
390 use_experimental_agc_agc2_level_estimation),
391 use_experimental_agc_agc2_digital_adaptive(
Alex Loikod9342442018-09-10 13:59:41 +0200392 use_experimental_agc_agc2_digital_adaptive),
393 use_experimental_agc_process_before_aec(
Sam Zackrissonfeee1e42019-09-20 07:50:35 +0200394 use_experimental_agc_process_before_aec),
395 experimental_multi_channel_render_support(
396 experimental_multi_channel_render_support),
397 experimental_multi_channel_capture_support(
398 experimental_multi_channel_capture_support) {}
peahdf3efa82015-11-28 12:35:15 -0800399 int agc_startup_min_volume;
henrik.lundinbd681b92016-12-05 09:08:42 -0800400 int agc_clipped_level_min;
peahbe615622016-02-13 16:40:47 -0800401 bool use_experimental_agc;
Alex Loiko64cb83b2018-07-02 13:38:19 +0200402 bool use_experimental_agc_agc2_level_estimation;
403 bool use_experimental_agc_agc2_digital_adaptive;
Alex Loikod9342442018-09-10 13:59:41 +0200404 bool use_experimental_agc_process_before_aec;
Sam Zackrissonfeee1e42019-09-20 07:50:35 +0200405 bool experimental_multi_channel_render_support;
406 bool experimental_multi_channel_capture_support;
peahdf3efa82015-11-28 12:35:15 -0800407 } constants_;
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000408
peahdf3efa82015-11-28 12:35:15 -0800409 struct ApmCaptureState {
Sam Zackrisson9394f6f2018-06-14 10:11:35 +0200410 ApmCaptureState(bool transient_suppressor_enabled);
kwiberg83ffe452016-08-29 14:46:07 -0700411 ~ApmCaptureState();
peahdf3efa82015-11-28 12:35:15 -0800412 int delay_offset_ms;
413 bool was_stream_delay_set;
peahdf3efa82015-11-28 12:35:15 -0800414 bool output_will_be_muted;
415 bool key_pressed;
416 bool transient_suppressor_enabled;
kwiberg88788ad2016-02-19 07:04:49 -0800417 std::unique_ptr<AudioBuffer> capture_audio;
Gustaf Ullberg422b9e02019-10-09 13:02:14 +0200418 std::unique_ptr<AudioBuffer> capture_fullband_audio;
peahde65ddc2016-09-16 15:02:15 -0700419 // Only the rate and samples fields of capture_processing_format_ are used
420 // because the capture processing number of channels is mutable and is
421 // tracked by the capture_audio_.
422 StreamConfig capture_processing_format;
peahdf3efa82015-11-28 12:35:15 -0800423 int split_rate;
peah67995532017-04-10 14:12:41 -0700424 bool echo_path_gain_change;
Per Åhgren88cf0502018-07-16 17:08:41 +0200425 int prev_analog_mic_level;
Per Åhgrend2650d12018-10-02 17:00:59 +0200426 float prev_pre_amp_gain;
Fredrik Hernqvistca362852019-05-10 15:50:02 +0200427 int playout_volume;
428 int prev_playout_volume;
Sam Zackrissonb24c00f2018-11-26 16:18:25 +0100429 AudioProcessingStats stats;
Per Åhgrena1351272019-08-15 12:15:46 +0200430 struct KeyboardInfo {
431 void Extract(const float* const* data, const StreamConfig& stream_config);
432 size_t num_keyboard_frames = 0;
433 const float* keyboard_data = nullptr;
434 } keyboard_info;
danilchap56359be2017-09-07 07:53:45 -0700435 } capture_ RTC_GUARDED_BY(crit_capture_);
niklase@google.com470e71d2011-07-07 08:21:25 +0000436
peahdf3efa82015-11-28 12:35:15 -0800437 struct ApmCaptureNonLockedState {
Alessio Bazzicacc22f512018-08-30 13:01:34 +0200438 ApmCaptureNonLockedState()
peahde65ddc2016-09-16 15:02:15 -0700439 : capture_processing_format(kSampleRate16kHz),
peahdf3efa82015-11-28 12:35:15 -0800440 split_rate(kSampleRate16kHz),
Alessio Bazzicacc22f512018-08-30 13:01:34 +0200441 stream_delay_ms(0) {}
peahde65ddc2016-09-16 15:02:15 -0700442 // Only the rate and samples fields of capture_processing_format_ are used
443 // because the forward processing number of channels is mutable and is
444 // tracked by the capture_audio_.
445 StreamConfig capture_processing_format;
peahdf3efa82015-11-28 12:35:15 -0800446 int split_rate;
447 int stream_delay_ms;
Gustaf Ullbergce045ac2017-10-16 13:49:04 +0200448 bool echo_controller_enabled = false;
Per Åhgrenf204faf2019-04-25 15:18:06 +0200449 bool use_aec2_extended_filter = false;
450 bool use_aec2_delay_agnostic = false;
451 bool use_aec2_refined_adaptive_filter = false;
peahdf3efa82015-11-28 12:35:15 -0800452 } capture_nonlocked_;
andrew@webrtc.org75dd2882014-02-11 20:52:30 +0000453
peahdf3efa82015-11-28 12:35:15 -0800454 struct ApmRenderState {
kwiberg83ffe452016-08-29 14:46:07 -0700455 ApmRenderState();
456 ~ApmRenderState();
kwiberg88788ad2016-02-19 07:04:49 -0800457 std::unique_ptr<AudioConverter> render_converter;
458 std::unique_ptr<AudioBuffer> render_audio;
danilchap56359be2017-09-07 07:53:45 -0700459 } render_ RTC_GUARDED_BY(crit_render_);
peah764e3642016-10-22 05:04:30 -0700460
danilchap56359be2017-09-07 07:53:45 -0700461 std::vector<float> aec_render_queue_buffer_ RTC_GUARDED_BY(crit_render_);
462 std::vector<float> aec_capture_queue_buffer_ RTC_GUARDED_BY(crit_capture_);
peaha0624602016-10-25 04:45:24 -0700463
danilchap56359be2017-09-07 07:53:45 -0700464 std::vector<int16_t> aecm_render_queue_buffer_ RTC_GUARDED_BY(crit_render_);
465 std::vector<int16_t> aecm_capture_queue_buffer_ RTC_GUARDED_BY(crit_capture_);
peah701d6282016-10-25 05:42:20 -0700466
danilchap56359be2017-09-07 07:53:45 -0700467 size_t agc_render_queue_element_max_size_ RTC_GUARDED_BY(crit_render_)
468 RTC_GUARDED_BY(crit_capture_) = 0;
469 std::vector<int16_t> agc_render_queue_buffer_ RTC_GUARDED_BY(crit_render_);
470 std::vector<int16_t> agc_capture_queue_buffer_ RTC_GUARDED_BY(crit_capture_);
peah764e3642016-10-22 05:04:30 -0700471
danilchap56359be2017-09-07 07:53:45 -0700472 size_t red_render_queue_element_max_size_ RTC_GUARDED_BY(crit_render_)
473 RTC_GUARDED_BY(crit_capture_) = 0;
474 std::vector<float> red_render_queue_buffer_ RTC_GUARDED_BY(crit_render_);
475 std::vector<float> red_capture_queue_buffer_ RTC_GUARDED_BY(crit_capture_);
ivoc9f4a4a02016-10-28 05:39:16 -0700476
danilchap56359be2017-09-07 07:53:45 -0700477 RmsLevel capture_input_rms_ RTC_GUARDED_BY(crit_capture_);
478 RmsLevel capture_output_rms_ RTC_GUARDED_BY(crit_capture_);
479 int capture_rms_interval_counter_ RTC_GUARDED_BY(crit_capture_) = 0;
henrik.lundin290d43a2016-11-29 08:09:09 -0800480
peah764e3642016-10-22 05:04:30 -0700481 // Lock protection not needed.
482 std::unique_ptr<SwapQueue<std::vector<float>, RenderQueueItemVerifier<float>>>
peah701d6282016-10-25 05:42:20 -0700483 aec_render_signal_queue_;
peaha0624602016-10-25 04:45:24 -0700484 std::unique_ptr<
485 SwapQueue<std::vector<int16_t>, RenderQueueItemVerifier<int16_t>>>
peah701d6282016-10-25 05:42:20 -0700486 aecm_render_signal_queue_;
487 std::unique_ptr<
488 SwapQueue<std::vector<int16_t>, RenderQueueItemVerifier<int16_t>>>
489 agc_render_signal_queue_;
ivoc9f4a4a02016-10-28 05:39:16 -0700490 std::unique_ptr<SwapQueue<std::vector<float>, RenderQueueItemVerifier<float>>>
491 red_render_signal_queue_;
niklase@google.com470e71d2011-07-07 08:21:25 +0000492};
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000493
niklase@google.com470e71d2011-07-07 08:21:25 +0000494} // namespace webrtc
495
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200496#endif // MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_