blob: dabc4b8a49a4e069e666c56dabb6a900e4e538ae [file] [log] [blame]
niklase@google.com470e71d2011-07-07 08:21:25 +00001/*
andrew@webrtc.org40654032012-01-30 20:51:15 +00002 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
niklase@google.com470e71d2011-07-07 08:21:25 +00003 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
andrew@webrtc.org78693fe2013-03-01 16:36:19 +000011#include "webrtc/modules/audio_processing/audio_processing_impl.h"
niklase@google.com470e71d2011-07-07 08:21:25 +000012
ajm@google.com808e0e02011-08-03 21:08:51 +000013#include <assert.h>
Michael Graczyk86c6d332015-07-23 11:41:39 -070014#include <algorithm>
niklase@google.com470e71d2011-07-07 08:21:25 +000015
Bjorn Volcker1ca324f2015-06-29 14:57:29 +020016#include "webrtc/base/checks.h"
xians@webrtc.orge46bc772014-10-10 08:36:56 +000017#include "webrtc/base/platform_file.h"
peah369f8282015-12-17 06:42:29 -080018#include "webrtc/base/trace_event.h"
ekmeyerson60d9b332015-08-14 10:35:55 -070019#include "webrtc/common_audio/audio_converter.h"
Michael Graczykdfa36052015-03-25 16:37:27 -070020#include "webrtc/common_audio/channel_buffer.h"
ekmeyerson60d9b332015-08-14 10:35:55 -070021#include "webrtc/common_audio/include/audio_util.h"
andrew@webrtc.org60730cf2014-01-07 17:45:09 +000022#include "webrtc/common_audio/signal_processing/include/signal_processing_library.h"
Bjorn Volcker1ca324f2015-06-29 14:57:29 +020023#include "webrtc/modules/audio_processing/aec/aec_core.h"
pbos@webrtc.org788acd12014-12-15 09:41:24 +000024#include "webrtc/modules/audio_processing/agc/agc_manager_direct.h"
andrew@webrtc.org78693fe2013-03-01 16:36:19 +000025#include "webrtc/modules/audio_processing/audio_buffer.h"
mgraczyk@chromium.org0f663de2015-03-13 00:13:32 +000026#include "webrtc/modules/audio_processing/beamformer/nonlinear_beamformer.h"
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +000027#include "webrtc/modules/audio_processing/common.h"
andrew@webrtc.org56e4a052014-02-27 22:23:17 +000028#include "webrtc/modules/audio_processing/echo_cancellation_impl.h"
andrew@webrtc.org78693fe2013-03-01 16:36:19 +000029#include "webrtc/modules/audio_processing/echo_control_mobile_impl.h"
peahbe615622016-02-13 16:40:47 -080030#include "webrtc/modules/audio_processing/gain_control_for_experimental_agc.h"
andrew@webrtc.org78693fe2013-03-01 16:36:19 +000031#include "webrtc/modules/audio_processing/gain_control_impl.h"
32#include "webrtc/modules/audio_processing/high_pass_filter_impl.h"
peah1bcfce52016-08-26 07:16:04 -070033#if WEBRTC_INTELLIGIBILITY_ENHANCER
ekmeyerson60d9b332015-08-14 10:35:55 -070034#include "webrtc/modules/audio_processing/intelligibility/intelligibility_enhancer.h"
peah1bcfce52016-08-26 07:16:04 -070035#endif
peahca4cac72016-06-29 15:26:12 -070036#include "webrtc/modules/audio_processing/level_controller/level_controller.h"
andrew@webrtc.org78693fe2013-03-01 16:36:19 +000037#include "webrtc/modules/audio_processing/level_estimator_impl.h"
38#include "webrtc/modules/audio_processing/noise_suppression_impl.h"
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +000039#include "webrtc/modules/audio_processing/transient/transient_suppressor.h"
andrew@webrtc.org78693fe2013-03-01 16:36:19 +000040#include "webrtc/modules/audio_processing/voice_detection_impl.h"
Henrik Kjellanderff761fb2015-11-04 08:31:52 +010041#include "webrtc/modules/include/module_common_types.h"
Henrik Kjellander98f53512015-10-28 18:17:40 +010042#include "webrtc/system_wrappers/include/file_wrapper.h"
43#include "webrtc/system_wrappers/include/logging.h"
44#include "webrtc/system_wrappers/include/metrics.h"
andrew@webrtc.org7bf26462011-12-03 00:03:31 +000045
46#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
47// Files generated at build-time by the protobuf compiler.
leozwang@webrtc.orga3736342012-03-16 21:36:00 +000048#ifdef WEBRTC_ANDROID_PLATFORM_BUILD
leozwang@webrtc.org534e4952012-10-22 21:21:52 +000049#include "external/webrtc/webrtc/modules/audio_processing/debug.pb.h"
leozwang@google.comce9bfbb2011-08-03 23:34:31 +000050#else
kjellander78ddd732016-02-09 08:13:06 -080051#include "webrtc/modules/audio_processing/debug.pb.h"
leozwang@google.comce9bfbb2011-08-03 23:34:31 +000052#endif
andrew@webrtc.org7bf26462011-12-03 00:03:31 +000053#endif // WEBRTC_AUDIOPROC_DEBUG_DUMP
niklase@google.com470e71d2011-07-07 08:21:25 +000054
peah1bcfce52016-08-26 07:16:04 -070055// Check to verify that the define for the intelligibility enhancer is properly
56// set.
57#if !defined(WEBRTC_INTELLIGIBILITY_ENHANCER) || \
58 (WEBRTC_INTELLIGIBILITY_ENHANCER != 0 && \
59 WEBRTC_INTELLIGIBILITY_ENHANCER != 1)
60#error "Set WEBRTC_INTELLIGIBILITY_ENHANCER to either 0 or 1"
61#endif
62
Michael Graczyk86c6d332015-07-23 11:41:39 -070063#define RETURN_ON_ERR(expr) \
64 do { \
65 int err = (expr); \
66 if (err != kNoError) { \
67 return err; \
68 } \
andrew@webrtc.org60730cf2014-01-07 17:45:09 +000069 } while (0)
70
niklase@google.com470e71d2011-07-07 08:21:25 +000071namespace webrtc {
aluebsdf6416a2016-03-16 18:26:35 -070072
73const int AudioProcessing::kNativeSampleRatesHz[] = {
74 AudioProcessing::kSampleRate8kHz,
75 AudioProcessing::kSampleRate16kHz,
aluebsdf6416a2016-03-16 18:26:35 -070076 AudioProcessing::kSampleRate32kHz,
77 AudioProcessing::kSampleRate48kHz};
aluebsdf6416a2016-03-16 18:26:35 -070078const size_t AudioProcessing::kNumNativeSampleRates =
79 arraysize(AudioProcessing::kNativeSampleRatesHz);
80const int AudioProcessing::kMaxNativeSampleRateHz = AudioProcessing::
81 kNativeSampleRatesHz[AudioProcessing::kNumNativeSampleRates - 1];
82
Michael Graczyk86c6d332015-07-23 11:41:39 -070083namespace {
84
peahcc34faf2016-08-30 09:49:13 -070085const int kInternalNativeRates[] = {AudioProcessing::kSampleRate8kHz,
86 AudioProcessing::kSampleRate16kHz,
87#ifdef WEBRTC_ARCH_ARM_FAMILY
88 AudioProcessing::kSampleRate32kHz};
89#else
90 AudioProcessing::kSampleRate32kHz,
91 AudioProcessing::kSampleRate48kHz};
92#endif // WEBRTC_ARCH_ARM_FAMILY
93
Michael Graczyk86c6d332015-07-23 11:41:39 -070094static bool LayoutHasKeyboard(AudioProcessing::ChannelLayout layout) {
95 switch (layout) {
96 case AudioProcessing::kMono:
97 case AudioProcessing::kStereo:
98 return false;
99 case AudioProcessing::kMonoAndKeyboard:
100 case AudioProcessing::kStereoAndKeyboard:
101 return true;
102 }
103
104 assert(false);
105 return false;
106}
aluebsdf6416a2016-03-16 18:26:35 -0700107
108bool is_multi_band(int sample_rate_hz) {
109 return sample_rate_hz == AudioProcessing::kSampleRate32kHz ||
110 sample_rate_hz == AudioProcessing::kSampleRate48kHz;
111}
112
peah423d2362016-04-09 16:06:52 -0700113int ClosestHigherNativeRate(int min_proc_rate) {
peahcc34faf2016-08-30 09:49:13 -0700114 for (int rate : kInternalNativeRates) {
aluebsdf6416a2016-03-16 18:26:35 -0700115 if (rate >= min_proc_rate) {
116 return rate;
117 }
118 }
peahcc34faf2016-08-30 09:49:13 -0700119 return kInternalNativeRates[arraysize(kInternalNativeRates) - 1];
aluebsdf6416a2016-03-16 18:26:35 -0700120}
121
Michael Graczyk86c6d332015-07-23 11:41:39 -0700122} // namespace
andrew@webrtc.org60730cf2014-01-07 17:45:09 +0000123
124// Throughout webrtc, it's assumed that success is represented by zero.
kwiberg@webrtc.org2ebfac52015-01-14 10:51:54 +0000125static_assert(AudioProcessing::kNoError == 0, "kNoError must be zero");
andrew@webrtc.org60730cf2014-01-07 17:45:09 +0000126
solenberg5e465c32015-12-08 13:22:33 -0800127struct AudioProcessingImpl::ApmPublicSubmodules {
peahbfa97112016-03-10 21:09:04 -0800128 ApmPublicSubmodules() {}
solenberg5e465c32015-12-08 13:22:33 -0800129 // Accessed externally of APM without any lock acquired.
peahb624d8c2016-03-05 03:01:14 -0800130 std::unique_ptr<EchoCancellationImpl> echo_cancellation;
peahbb9edbd2016-03-10 12:54:25 -0800131 std::unique_ptr<EchoControlMobileImpl> echo_control_mobile;
peahbfa97112016-03-10 21:09:04 -0800132 std::unique_ptr<GainControlImpl> gain_control;
kwiberg88788ad2016-02-19 07:04:49 -0800133 std::unique_ptr<HighPassFilterImpl> high_pass_filter;
134 std::unique_ptr<LevelEstimatorImpl> level_estimator;
135 std::unique_ptr<NoiseSuppressionImpl> noise_suppression;
136 std::unique_ptr<VoiceDetectionImpl> voice_detection;
137 std::unique_ptr<GainControlForExperimentalAgc>
peahbe615622016-02-13 16:40:47 -0800138 gain_control_for_experimental_agc;
solenberg5e465c32015-12-08 13:22:33 -0800139
140 // Accessed internally from both render and capture.
kwiberg88788ad2016-02-19 07:04:49 -0800141 std::unique_ptr<TransientSuppressor> transient_suppressor;
peah1bcfce52016-08-26 07:16:04 -0700142#if WEBRTC_INTELLIGIBILITY_ENHANCER
kwiberg88788ad2016-02-19 07:04:49 -0800143 std::unique_ptr<IntelligibilityEnhancer> intelligibility_enhancer;
peah1bcfce52016-08-26 07:16:04 -0700144#endif
solenberg5e465c32015-12-08 13:22:33 -0800145};
146
147struct AudioProcessingImpl::ApmPrivateSubmodules {
Alejandro Luebsf4022ff2016-07-01 17:19:09 -0700148 explicit ApmPrivateSubmodules(NonlinearBeamformer* beamformer)
solenberg5e465c32015-12-08 13:22:33 -0800149 : beamformer(beamformer) {}
150 // Accessed internally from capture or during initialization
Alejandro Luebsf4022ff2016-07-01 17:19:09 -0700151 std::unique_ptr<NonlinearBeamformer> beamformer;
kwiberg88788ad2016-02-19 07:04:49 -0800152 std::unique_ptr<AgcManagerDirect> agc_manager;
peahca4cac72016-06-29 15:26:12 -0700153 std::unique_ptr<LevelController> level_controller;
solenberg5e465c32015-12-08 13:22:33 -0800154};
155
andrew@webrtc.orge84978f2014-01-25 02:09:06 +0000156AudioProcessing* AudioProcessing::Create() {
peahc8bbe3f2016-09-09 14:15:57 -0700157 webrtc::Config config;
aluebs@webrtc.orgd82f55d2015-01-15 18:07:21 +0000158 return Create(config, nullptr);
andrew@webrtc.orge84978f2014-01-25 02:09:06 +0000159}
160
peahc8bbe3f2016-09-09 14:15:57 -0700161AudioProcessing* AudioProcessing::Create(const webrtc::Config& config) {
aluebs@webrtc.orgd82f55d2015-01-15 18:07:21 +0000162 return Create(config, nullptr);
163}
164
peahc8bbe3f2016-09-09 14:15:57 -0700165AudioProcessing* AudioProcessing::Create(const webrtc::Config& config,
Alejandro Luebsf4022ff2016-07-01 17:19:09 -0700166 NonlinearBeamformer* beamformer) {
aluebs@webrtc.orgd82f55d2015-01-15 18:07:21 +0000167 AudioProcessingImpl* apm = new AudioProcessingImpl(config, beamformer);
niklase@google.com470e71d2011-07-07 08:21:25 +0000168 if (apm->Initialize() != kNoError) {
169 delete apm;
peahdf3efa82015-11-28 12:35:15 -0800170 apm = nullptr;
niklase@google.com470e71d2011-07-07 08:21:25 +0000171 }
172
173 return apm;
174}
175
peahc8bbe3f2016-09-09 14:15:57 -0700176AudioProcessingImpl::AudioProcessingImpl(const webrtc::Config& config)
aluebs@webrtc.orgd82f55d2015-01-15 18:07:21 +0000177 : AudioProcessingImpl(config, nullptr) {}
178
peahc8bbe3f2016-09-09 14:15:57 -0700179AudioProcessingImpl::AudioProcessingImpl(const webrtc::Config& config,
Alejandro Luebsf4022ff2016-07-01 17:19:09 -0700180 NonlinearBeamformer* beamformer)
peahdf3efa82015-11-28 12:35:15 -0800181 : public_submodules_(new ApmPublicSubmodules()),
182 private_submodules_(new ApmPrivateSubmodules(beamformer)),
183 constants_(config.Get<ExperimentalAgc>().startup_min_volume,
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000184#if defined(WEBRTC_ANDROID) || defined(WEBRTC_IOS)
Alejandro Luebsc9b0c262016-05-16 15:32:38 -0700185 false),
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000186#else
Alejandro Luebsc9b0c262016-05-16 15:32:38 -0700187 config.Get<ExperimentalAgc>().enabled),
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000188#endif
andrew1c7075f2015-06-24 18:14:14 -0700189#if defined(WEBRTC_ANDROID) || defined(WEBRTC_IOS)
aluebs2a346882016-01-11 18:04:30 -0800190 capture_(false,
andrew1c7075f2015-06-24 18:14:14 -0700191#else
aluebs2a346882016-01-11 18:04:30 -0800192 capture_(config.Get<ExperimentalNs>().enabled,
andrew1c7075f2015-06-24 18:14:14 -0700193#endif
aluebs2a346882016-01-11 18:04:30 -0800194 config.Get<Beamforming>().array_geometry,
aluebsb2328d12016-01-11 20:32:29 -0800195 config.Get<Beamforming>().target_direction),
Alejandro Luebsc9b0c262016-05-16 15:32:38 -0700196 capture_nonlocked_(config.Get<Beamforming>().enabled,
peahc8bbe3f2016-09-09 14:15:57 -0700197 config.Get<Intelligibility>().enabled) {
peahdf3efa82015-11-28 12:35:15 -0800198 {
199 rtc::CritScope cs_render(&crit_render_);
200 rtc::CritScope cs_capture(&crit_capture_);
niklase@google.com470e71d2011-07-07 08:21:25 +0000201
peahb624d8c2016-03-05 03:01:14 -0800202 public_submodules_->echo_cancellation.reset(
peahb58a1582016-03-15 09:34:24 -0700203 new EchoCancellationImpl(&crit_render_, &crit_capture_));
peahbb9edbd2016-03-10 12:54:25 -0800204 public_submodules_->echo_control_mobile.reset(
peah253534d2016-03-15 04:32:28 -0700205 new EchoControlMobileImpl(&crit_render_, &crit_capture_));
peahbfa97112016-03-10 21:09:04 -0800206 public_submodules_->gain_control.reset(
peahb8fbb542016-03-15 02:28:08 -0700207 new GainControlImpl(&crit_capture_, &crit_capture_));
solenberg70f99032015-12-08 11:07:32 -0800208 public_submodules_->high_pass_filter.reset(
209 new HighPassFilterImpl(&crit_capture_));
solenberg949028f2015-12-15 11:39:38 -0800210 public_submodules_->level_estimator.reset(
211 new LevelEstimatorImpl(&crit_capture_));
solenberg5e465c32015-12-08 13:22:33 -0800212 public_submodules_->noise_suppression.reset(
213 new NoiseSuppressionImpl(&crit_capture_));
solenberga29386c2015-12-16 03:31:12 -0800214 public_submodules_->voice_detection.reset(
215 new VoiceDetectionImpl(&crit_capture_));
peahbe615622016-02-13 16:40:47 -0800216 public_submodules_->gain_control_for_experimental_agc.reset(
peahbfa97112016-03-10 21:09:04 -0800217 new GainControlForExperimentalAgc(
218 public_submodules_->gain_control.get(), &crit_capture_));
peahca4cac72016-06-29 15:26:12 -0700219
220 private_submodules_->level_controller.reset(new LevelController());
peahdf3efa82015-11-28 12:35:15 -0800221 }
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000222
andrew@webrtc.orge84978f2014-01-25 02:09:06 +0000223 SetExtraOptions(config);
niklase@google.com470e71d2011-07-07 08:21:25 +0000224}
225
226AudioProcessingImpl::~AudioProcessingImpl() {
peahdf3efa82015-11-28 12:35:15 -0800227 // Depends on gain_control_ and
peahbe615622016-02-13 16:40:47 -0800228 // public_submodules_->gain_control_for_experimental_agc.
peahdf3efa82015-11-28 12:35:15 -0800229 private_submodules_->agc_manager.reset();
230 // Depends on gain_control_.
peahbe615622016-02-13 16:40:47 -0800231 public_submodules_->gain_control_for_experimental_agc.reset();
niklase@google.com470e71d2011-07-07 08:21:25 +0000232
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000233#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700234 debug_dump_.debug_file->CloseFile();
peahdf3efa82015-11-28 12:35:15 -0800235#endif
niklase@google.com470e71d2011-07-07 08:21:25 +0000236}
237
niklase@google.com470e71d2011-07-07 08:21:25 +0000238int AudioProcessingImpl::Initialize() {
peahdf3efa82015-11-28 12:35:15 -0800239 // Run in a single-threaded manner during initialization.
240 rtc::CritScope cs_render(&crit_render_);
241 rtc::CritScope cs_capture(&crit_capture_);
niklase@google.com470e71d2011-07-07 08:21:25 +0000242 return InitializeLocked();
243}
244
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000245int AudioProcessingImpl::Initialize(int input_sample_rate_hz,
246 int output_sample_rate_hz,
247 int reverse_sample_rate_hz,
248 ChannelLayout input_layout,
249 ChannelLayout output_layout,
250 ChannelLayout reverse_layout) {
Michael Graczyk86c6d332015-07-23 11:41:39 -0700251 const ProcessingConfig processing_config = {
ekmeyerson60d9b332015-08-14 10:35:55 -0700252 {{input_sample_rate_hz,
253 ChannelsFromLayout(input_layout),
Michael Graczyk86c6d332015-07-23 11:41:39 -0700254 LayoutHasKeyboard(input_layout)},
ekmeyerson60d9b332015-08-14 10:35:55 -0700255 {output_sample_rate_hz,
256 ChannelsFromLayout(output_layout),
Michael Graczyk86c6d332015-07-23 11:41:39 -0700257 LayoutHasKeyboard(output_layout)},
ekmeyerson60d9b332015-08-14 10:35:55 -0700258 {reverse_sample_rate_hz,
259 ChannelsFromLayout(reverse_layout),
260 LayoutHasKeyboard(reverse_layout)},
261 {reverse_sample_rate_hz,
262 ChannelsFromLayout(reverse_layout),
Michael Graczyk86c6d332015-07-23 11:41:39 -0700263 LayoutHasKeyboard(reverse_layout)}}};
264
265 return Initialize(processing_config);
266}
267
268int AudioProcessingImpl::Initialize(const ProcessingConfig& processing_config) {
peahdf3efa82015-11-28 12:35:15 -0800269 // Run in a single-threaded manner during initialization.
270 rtc::CritScope cs_render(&crit_render_);
271 rtc::CritScope cs_capture(&crit_capture_);
Michael Graczyk86c6d332015-07-23 11:41:39 -0700272 return InitializeLocked(processing_config);
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000273}
274
peahdf3efa82015-11-28 12:35:15 -0800275int AudioProcessingImpl::MaybeInitializeRender(
peah81b9bfe2015-11-27 02:47:28 -0800276 const ProcessingConfig& processing_config) {
peahdf3efa82015-11-28 12:35:15 -0800277 return MaybeInitialize(processing_config);
peah81b9bfe2015-11-27 02:47:28 -0800278}
279
peahdf3efa82015-11-28 12:35:15 -0800280int AudioProcessingImpl::MaybeInitializeCapture(
peah81b9bfe2015-11-27 02:47:28 -0800281 const ProcessingConfig& processing_config) {
peahdf3efa82015-11-28 12:35:15 -0800282 return MaybeInitialize(processing_config);
peah81b9bfe2015-11-27 02:47:28 -0800283}
284
kwiberg83ffe452016-08-29 14:46:07 -0700285#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
286
287AudioProcessingImpl::ApmDebugDumpThreadState::ApmDebugDumpThreadState()
288 : event_msg(new audioproc::Event()) {}
289
290AudioProcessingImpl::ApmDebugDumpThreadState::~ApmDebugDumpThreadState() {}
291
292AudioProcessingImpl::ApmDebugDumpState::ApmDebugDumpState()
293 : debug_file(FileWrapper::Create()) {}
294
295AudioProcessingImpl::ApmDebugDumpState::~ApmDebugDumpState() {}
296
297#endif // WEBRTC_AUDIOPROC_DEBUG_DUMP
298
peah192164e2015-11-17 02:16:45 -0800299// Calls InitializeLocked() if any of the audio parameters have changed from
peahdf3efa82015-11-28 12:35:15 -0800300// their current values (needs to be called while holding the crit_render_lock).
301int AudioProcessingImpl::MaybeInitialize(
peah192164e2015-11-17 02:16:45 -0800302 const ProcessingConfig& processing_config) {
peahdf3efa82015-11-28 12:35:15 -0800303 // Called from both threads. Thread check is therefore not possible.
304 if (processing_config == formats_.api_format) {
peah192164e2015-11-17 02:16:45 -0800305 return kNoError;
306 }
peahdf3efa82015-11-28 12:35:15 -0800307
308 rtc::CritScope cs_capture(&crit_capture_);
peah192164e2015-11-17 02:16:45 -0800309 return InitializeLocked(processing_config);
310}
311
niklase@google.com470e71d2011-07-07 08:21:25 +0000312int AudioProcessingImpl::InitializeLocked() {
Michael Graczyk86c6d332015-07-23 11:41:39 -0700313 const int fwd_audio_buffer_channels =
aluebsb2328d12016-01-11 20:32:29 -0800314 capture_nonlocked_.beamformer_enabled
peahdf3efa82015-11-28 12:35:15 -0800315 ? formats_.api_format.input_stream().num_channels()
316 : formats_.api_format.output_stream().num_channels();
ekmeyerson60d9b332015-08-14 10:35:55 -0700317 const int rev_audio_buffer_out_num_frames =
peahdf3efa82015-11-28 12:35:15 -0800318 formats_.api_format.reverse_output_stream().num_frames() == 0
319 ? formats_.rev_proc_format.num_frames()
320 : formats_.api_format.reverse_output_stream().num_frames();
321 if (formats_.api_format.reverse_input_stream().num_channels() > 0) {
322 render_.render_audio.reset(new AudioBuffer(
323 formats_.api_format.reverse_input_stream().num_frames(),
324 formats_.api_format.reverse_input_stream().num_channels(),
325 formats_.rev_proc_format.num_frames(),
326 formats_.rev_proc_format.num_channels(),
ekmeyerson60d9b332015-08-14 10:35:55 -0700327 rev_audio_buffer_out_num_frames));
328 if (rev_conversion_needed()) {
kwibergc2b785d2016-02-24 05:22:32 -0800329 render_.render_converter = AudioConverter::Create(
peahdf3efa82015-11-28 12:35:15 -0800330 formats_.api_format.reverse_input_stream().num_channels(),
331 formats_.api_format.reverse_input_stream().num_frames(),
332 formats_.api_format.reverse_output_stream().num_channels(),
kwibergc2b785d2016-02-24 05:22:32 -0800333 formats_.api_format.reverse_output_stream().num_frames());
ekmeyerson60d9b332015-08-14 10:35:55 -0700334 } else {
peahdf3efa82015-11-28 12:35:15 -0800335 render_.render_converter.reset(nullptr);
ekmeyerson60d9b332015-08-14 10:35:55 -0700336 }
Michael Graczyk86c6d332015-07-23 11:41:39 -0700337 } else {
peahdf3efa82015-11-28 12:35:15 -0800338 render_.render_audio.reset(nullptr);
339 render_.render_converter.reset(nullptr);
Michael Graczyk86c6d332015-07-23 11:41:39 -0700340 }
peahdf3efa82015-11-28 12:35:15 -0800341 capture_.capture_audio.reset(
342 new AudioBuffer(formats_.api_format.input_stream().num_frames(),
343 formats_.api_format.input_stream().num_channels(),
344 capture_nonlocked_.fwd_proc_format.num_frames(),
345 fwd_audio_buffer_channels,
346 formats_.api_format.output_stream().num_frames()));
niklase@google.com470e71d2011-07-07 08:21:25 +0000347
peahbfa97112016-03-10 21:09:04 -0800348 InitializeGainController();
peahb624d8c2016-03-05 03:01:14 -0800349 InitializeEchoCanceller();
peahbb9edbd2016-03-10 12:54:25 -0800350 InitializeEchoControlMobile();
Bjorn Volckeradc46c42015-04-15 11:42:40 +0200351 InitializeExperimentalAgc();
Bjorn Volckeradc46c42015-04-15 11:42:40 +0200352 InitializeTransient();
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +0000353 InitializeBeamformer();
peah1bcfce52016-08-26 07:16:04 -0700354#if WEBRTC_INTELLIGIBILITY_ENHANCER
ekmeyerson60d9b332015-08-14 10:35:55 -0700355 InitializeIntelligibility();
peah1bcfce52016-08-26 07:16:04 -0700356#endif
solenberg70f99032015-12-08 11:07:32 -0800357 InitializeHighPassFilter();
solenberg5e465c32015-12-08 13:22:33 -0800358 InitializeNoiseSuppression();
solenberg949028f2015-12-15 11:39:38 -0800359 InitializeLevelEstimator();
solenberga29386c2015-12-16 03:31:12 -0800360 InitializeVoiceDetection();
peahca4cac72016-06-29 15:26:12 -0700361 InitializeLevelController();
solenberg70f99032015-12-08 11:07:32 -0800362
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000363#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700364 if (debug_dump_.debug_file->is_open()) {
ajm@google.com808e0e02011-08-03 21:08:51 +0000365 int err = WriteInitMessage();
366 if (err != kNoError) {
367 return err;
368 }
369 }
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000370#endif
ajm@google.com808e0e02011-08-03 21:08:51 +0000371
niklase@google.com470e71d2011-07-07 08:21:25 +0000372 return kNoError;
373}
374
Michael Graczyk86c6d332015-07-23 11:41:39 -0700375int AudioProcessingImpl::InitializeLocked(const ProcessingConfig& config) {
376 for (const auto& stream : config.streams) {
Michael Graczyk86c6d332015-07-23 11:41:39 -0700377 if (stream.num_channels() > 0 && stream.sample_rate_hz() <= 0) {
378 return kBadSampleRateError;
379 }
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000380 }
Michael Graczyk86c6d332015-07-23 11:41:39 -0700381
Peter Kasting69558702016-01-12 16:26:35 -0800382 const size_t num_in_channels = config.input_stream().num_channels();
383 const size_t num_out_channels = config.output_stream().num_channels();
Michael Graczyk86c6d332015-07-23 11:41:39 -0700384
385 // Need at least one input channel.
386 // Need either one output channel or as many outputs as there are inputs.
387 if (num_in_channels == 0 ||
388 !(num_out_channels == 1 || num_out_channels == num_in_channels)) {
Michael Graczykc2047542015-07-22 21:06:11 -0700389 return kBadNumberChannelsError;
390 }
391
aluebsb2328d12016-01-11 20:32:29 -0800392 if (capture_nonlocked_.beamformer_enabled &&
Peter Kasting69558702016-01-12 16:26:35 -0800393 num_in_channels != capture_.array_geometry.size()) {
Michael Graczyk86c6d332015-07-23 11:41:39 -0700394 return kBadNumberChannelsError;
395 }
396
peahdf3efa82015-11-28 12:35:15 -0800397 formats_.api_format = config;
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000398
peah423d2362016-04-09 16:06:52 -0700399 capture_nonlocked_.fwd_proc_format = StreamConfig(ClosestHigherNativeRate(
400 std::min(formats_.api_format.input_stream().sample_rate_hz(),
401 formats_.api_format.output_stream().sample_rate_hz())));
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000402
aluebseb3603b2016-04-20 15:27:58 -0700403 int rev_proc_rate = ClosestHigherNativeRate(std::min(
404 formats_.api_format.reverse_input_stream().sample_rate_hz(),
405 formats_.api_format.reverse_output_stream().sample_rate_hz()));
406 // TODO(aluebs): Remove this restriction once we figure out why the 3-band
407 // splitting filter degrades the AEC performance.
408 if (rev_proc_rate > kSampleRate32kHz) {
409 rev_proc_rate = is_rev_processed() ? kSampleRate32kHz : kSampleRate16kHz;
410 }
411 // If the forward sample rate is 8 kHz, the reverse stream is also processed
412 // at this rate.
peahdf3efa82015-11-28 12:35:15 -0800413 if (capture_nonlocked_.fwd_proc_format.sample_rate_hz() == kSampleRate8kHz) {
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000414 rev_proc_rate = kSampleRate8kHz;
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000415 } else {
aluebseb3603b2016-04-20 15:27:58 -0700416 rev_proc_rate = std::max(rev_proc_rate, static_cast<int>(kSampleRate16kHz));
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000417 }
418
andrew@webrtc.org30be8272014-09-24 20:06:23 +0000419 // Always downmix the reverse stream to mono for analysis. This has been
420 // demonstrated to work well for AEC in most practical scenarios.
peahdf3efa82015-11-28 12:35:15 -0800421 formats_.rev_proc_format = StreamConfig(rev_proc_rate, 1);
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000422
peahdf3efa82015-11-28 12:35:15 -0800423 if (capture_nonlocked_.fwd_proc_format.sample_rate_hz() == kSampleRate32kHz ||
424 capture_nonlocked_.fwd_proc_format.sample_rate_hz() == kSampleRate48kHz) {
425 capture_nonlocked_.split_rate = kSampleRate16kHz;
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000426 } else {
peahdf3efa82015-11-28 12:35:15 -0800427 capture_nonlocked_.split_rate =
428 capture_nonlocked_.fwd_proc_format.sample_rate_hz();
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000429 }
430
431 return InitializeLocked();
432}
433
peahc8bbe3f2016-09-09 14:15:57 -0700434void AudioProcessingImpl::ApplyConfig(const AudioProcessing::Config& config) {
435 AudioProcessing::Config config_to_use = config;
436
437 bool config_ok = LevelController::Validate(config_to_use.level_controller);
438 if (!config_ok) {
439 LOG(LS_ERROR) << "AudioProcessing module config error" << std::endl
440 << "level_controller: "
441 << LevelController::ToString(config_to_use.level_controller)
442 << std::endl
443 << "Reverting to default parameter set";
444 config_to_use.level_controller = AudioProcessing::Config::LevelController();
445 }
446
447 // Run in a single-threaded manner when applying the settings.
448 rtc::CritScope cs_render(&crit_render_);
449 rtc::CritScope cs_capture(&crit_capture_);
450
451 if (config.level_controller.enabled !=
452 capture_nonlocked_.level_controller_enabled) {
453 InitializeLevelController();
454 LOG(LS_INFO) << "Level controller activated: "
455 << capture_nonlocked_.level_controller_enabled;
456 capture_nonlocked_.level_controller_enabled =
457 config.level_controller.enabled;
458 }
459}
460
461void AudioProcessingImpl::SetExtraOptions(const webrtc::Config& config) {
peahdf3efa82015-11-28 12:35:15 -0800462 // Run in a single-threaded manner when setting the extra options.
463 rtc::CritScope cs_render(&crit_render_);
464 rtc::CritScope cs_capture(&crit_capture_);
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000465
peahb624d8c2016-03-05 03:01:14 -0800466 public_submodules_->echo_cancellation->SetExtraOptions(config);
467
peahdf3efa82015-11-28 12:35:15 -0800468 if (capture_.transient_suppressor_enabled !=
469 config.Get<ExperimentalNs>().enabled) {
470 capture_.transient_suppressor_enabled =
471 config.Get<ExperimentalNs>().enabled;
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000472 InitializeTransient();
473 }
aluebs2a346882016-01-11 18:04:30 -0800474
peah1bcfce52016-08-26 07:16:04 -0700475#if WEBRTC_INTELLIGIBILITY_ENHANCER
Alejandro Luebsc9b0c262016-05-16 15:32:38 -0700476 if(capture_nonlocked_.intelligibility_enabled !=
477 config.Get<Intelligibility>().enabled) {
478 capture_nonlocked_.intelligibility_enabled =
479 config.Get<Intelligibility>().enabled;
480 InitializeIntelligibility();
481 }
peah1bcfce52016-08-26 07:16:04 -0700482#endif
Alejandro Luebsc9b0c262016-05-16 15:32:38 -0700483
aluebs2a346882016-01-11 18:04:30 -0800484#ifdef WEBRTC_ANDROID_PLATFORM_BUILD
aluebsb2328d12016-01-11 20:32:29 -0800485 if (capture_nonlocked_.beamformer_enabled !=
486 config.Get<Beamforming>().enabled) {
487 capture_nonlocked_.beamformer_enabled = config.Get<Beamforming>().enabled;
aluebs2a346882016-01-11 18:04:30 -0800488 if (config.Get<Beamforming>().array_geometry.size() > 1) {
489 capture_.array_geometry = config.Get<Beamforming>().array_geometry;
490 }
491 capture_.target_direction = config.Get<Beamforming>().target_direction;
492 InitializeBeamformer();
493 }
494#endif // WEBRTC_ANDROID_PLATFORM_BUILD
andrew@webrtc.org61e596f2013-07-25 18:28:29 +0000495}
496
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000497int AudioProcessingImpl::proc_sample_rate_hz() const {
peahdf3efa82015-11-28 12:35:15 -0800498 // Used as callback from submodules, hence locking is not allowed.
499 return capture_nonlocked_.fwd_proc_format.sample_rate_hz();
niklase@google.com470e71d2011-07-07 08:21:25 +0000500}
501
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000502int AudioProcessingImpl::proc_split_sample_rate_hz() const {
peahdf3efa82015-11-28 12:35:15 -0800503 // Used as callback from submodules, hence locking is not allowed.
504 return capture_nonlocked_.split_rate;
niklase@google.com470e71d2011-07-07 08:21:25 +0000505}
506
Peter Kasting69558702016-01-12 16:26:35 -0800507size_t AudioProcessingImpl::num_reverse_channels() const {
peahdf3efa82015-11-28 12:35:15 -0800508 // Used as callback from submodules, hence locking is not allowed.
509 return formats_.rev_proc_format.num_channels();
niklase@google.com470e71d2011-07-07 08:21:25 +0000510}
511
Peter Kasting69558702016-01-12 16:26:35 -0800512size_t AudioProcessingImpl::num_input_channels() const {
peahdf3efa82015-11-28 12:35:15 -0800513 // Used as callback from submodules, hence locking is not allowed.
514 return formats_.api_format.input_stream().num_channels();
niklase@google.com470e71d2011-07-07 08:21:25 +0000515}
516
Peter Kasting69558702016-01-12 16:26:35 -0800517size_t AudioProcessingImpl::num_proc_channels() const {
aluebsb2328d12016-01-11 20:32:29 -0800518 // Used as callback from submodules, hence locking is not allowed.
519 return capture_nonlocked_.beamformer_enabled ? 1 : num_output_channels();
520}
521
Peter Kasting69558702016-01-12 16:26:35 -0800522size_t AudioProcessingImpl::num_output_channels() const {
peahdf3efa82015-11-28 12:35:15 -0800523 // Used as callback from submodules, hence locking is not allowed.
524 return formats_.api_format.output_stream().num_channels();
niklase@google.com470e71d2011-07-07 08:21:25 +0000525}
526
andrew@webrtc.org17342e52014-02-12 22:28:31 +0000527void AudioProcessingImpl::set_output_will_be_muted(bool muted) {
peahdf3efa82015-11-28 12:35:15 -0800528 rtc::CritScope cs(&crit_capture_);
529 capture_.output_will_be_muted = muted;
530 if (private_submodules_->agc_manager.get()) {
531 private_submodules_->agc_manager->SetCaptureMuted(
532 capture_.output_will_be_muted);
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000533 }
andrew@webrtc.org17342e52014-02-12 22:28:31 +0000534}
535
andrew@webrtc.org17342e52014-02-12 22:28:31 +0000536
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000537int AudioProcessingImpl::ProcessStream(const float* const* src,
Peter Kastingdce40cf2015-08-24 14:52:23 -0700538 size_t samples_per_channel,
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000539 int input_sample_rate_hz,
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000540 ChannelLayout input_layout,
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000541 int output_sample_rate_hz,
542 ChannelLayout output_layout,
543 float* const* dest) {
peah369f8282015-12-17 06:42:29 -0800544 TRACE_EVENT0("webrtc", "AudioProcessing::ProcessStream_ChannelLayout");
peahdf3efa82015-11-28 12:35:15 -0800545 StreamConfig input_stream;
546 StreamConfig output_stream;
547 {
548 // Access the formats_.api_format.input_stream beneath the capture lock.
549 // The lock must be released as it is later required in the call
550 // to ProcessStream(,,,);
551 rtc::CritScope cs(&crit_capture_);
552 input_stream = formats_.api_format.input_stream();
553 output_stream = formats_.api_format.output_stream();
554 }
555
Michael Graczyk86c6d332015-07-23 11:41:39 -0700556 input_stream.set_sample_rate_hz(input_sample_rate_hz);
557 input_stream.set_num_channels(ChannelsFromLayout(input_layout));
558 input_stream.set_has_keyboard(LayoutHasKeyboard(input_layout));
Michael Graczyk86c6d332015-07-23 11:41:39 -0700559 output_stream.set_sample_rate_hz(output_sample_rate_hz);
560 output_stream.set_num_channels(ChannelsFromLayout(output_layout));
561 output_stream.set_has_keyboard(LayoutHasKeyboard(output_layout));
562
563 if (samples_per_channel != input_stream.num_frames()) {
564 return kBadDataLengthError;
565 }
566 return ProcessStream(src, input_stream, output_stream, dest);
567}
568
569int AudioProcessingImpl::ProcessStream(const float* const* src,
570 const StreamConfig& input_config,
571 const StreamConfig& output_config,
572 float* const* dest) {
peah369f8282015-12-17 06:42:29 -0800573 TRACE_EVENT0("webrtc", "AudioProcessing::ProcessStream_StreamConfig");
peahdf3efa82015-11-28 12:35:15 -0800574 ProcessingConfig processing_config;
575 {
576 // Acquire the capture lock in order to safely call the function
577 // that retrieves the render side data. This function accesses apm
578 // getters that need the capture lock held when being called.
579 rtc::CritScope cs_capture(&crit_capture_);
580 public_submodules_->echo_cancellation->ReadQueuedRenderData();
581 public_submodules_->echo_control_mobile->ReadQueuedRenderData();
582 public_submodules_->gain_control->ReadQueuedRenderData();
583
584 if (!src || !dest) {
585 return kNullPointerError;
586 }
587
588 processing_config = formats_.api_format;
niklase@google.com470e71d2011-07-07 08:21:25 +0000589 }
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000590
Michael Graczyk86c6d332015-07-23 11:41:39 -0700591 processing_config.input_stream() = input_config;
592 processing_config.output_stream() = output_config;
593
peahdf3efa82015-11-28 12:35:15 -0800594 {
595 // Do conditional reinitialization.
596 rtc::CritScope cs_render(&crit_render_);
597 RETURN_ON_ERR(MaybeInitializeCapture(processing_config));
598 }
599 rtc::CritScope cs_capture(&crit_capture_);
Michael Graczyk86c6d332015-07-23 11:41:39 -0700600 assert(processing_config.input_stream().num_frames() ==
peahdf3efa82015-11-28 12:35:15 -0800601 formats_.api_format.input_stream().num_frames());
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000602
603#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700604 if (debug_dump_.debug_file->is_open()) {
Minyue13b96ba2015-10-03 00:39:14 +0200605 RETURN_ON_ERR(WriteConfigMessage(false));
606
peahdf3efa82015-11-28 12:35:15 -0800607 debug_dump_.capture.event_msg->set_type(audioproc::Event::STREAM);
608 audioproc::Stream* msg = debug_dump_.capture.event_msg->mutable_stream();
aluebs@webrtc.org59a1b1b2014-08-28 10:43:09 +0000609 const size_t channel_size =
peahdf3efa82015-11-28 12:35:15 -0800610 sizeof(float) * formats_.api_format.input_stream().num_frames();
Peter Kasting69558702016-01-12 16:26:35 -0800611 for (size_t i = 0; i < formats_.api_format.input_stream().num_channels();
612 ++i)
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000613 msg->add_input_channel(src[i], channel_size);
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000614 }
615#endif
616
peahdf3efa82015-11-28 12:35:15 -0800617 capture_.capture_audio->CopyFrom(src, formats_.api_format.input_stream());
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000618 RETURN_ON_ERR(ProcessStreamLocked());
peahdf3efa82015-11-28 12:35:15 -0800619 capture_.capture_audio->CopyTo(formats_.api_format.output_stream(), dest);
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000620
621#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700622 if (debug_dump_.debug_file->is_open()) {
peahdf3efa82015-11-28 12:35:15 -0800623 audioproc::Stream* msg = debug_dump_.capture.event_msg->mutable_stream();
aluebs@webrtc.org59a1b1b2014-08-28 10:43:09 +0000624 const size_t channel_size =
peahdf3efa82015-11-28 12:35:15 -0800625 sizeof(float) * formats_.api_format.output_stream().num_frames();
Peter Kasting69558702016-01-12 16:26:35 -0800626 for (size_t i = 0; i < formats_.api_format.output_stream().num_channels();
627 ++i)
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000628 msg->add_output_channel(dest[i], channel_size);
peahdf3efa82015-11-28 12:35:15 -0800629 RETURN_ON_ERR(WriteMessageToDebugFile(debug_dump_.debug_file.get(),
ivocd66b44d2016-01-15 03:06:36 -0800630 &debug_dump_.num_bytes_left_for_log_,
peahdf3efa82015-11-28 12:35:15 -0800631 &crit_debug_, &debug_dump_.capture));
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000632 }
633#endif
634
635 return kNoError;
636}
637
638int AudioProcessingImpl::ProcessStream(AudioFrame* frame) {
peah369f8282015-12-17 06:42:29 -0800639 TRACE_EVENT0("webrtc", "AudioProcessing::ProcessStream_AudioFrame");
peahdf3efa82015-11-28 12:35:15 -0800640 {
641 // Acquire the capture lock in order to safely call the function
642 // that retrieves the render side data. This function accesses apm
643 // getters that need the capture lock held when being called.
644 // The lock needs to be released as
645 // public_submodules_->echo_control_mobile->is_enabled() aquires this lock
646 // as well.
647 rtc::CritScope cs_capture(&crit_capture_);
648 public_submodules_->echo_cancellation->ReadQueuedRenderData();
649 public_submodules_->echo_control_mobile->ReadQueuedRenderData();
650 public_submodules_->gain_control->ReadQueuedRenderData();
651 }
peahfa6228e2015-11-16 16:27:42 -0800652
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000653 if (!frame) {
654 return kNullPointerError;
655 }
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000656 // Must be a native rate.
657 if (frame->sample_rate_hz_ != kSampleRate8kHz &&
658 frame->sample_rate_hz_ != kSampleRate16kHz &&
aluebs@webrtc.org087da132014-11-17 23:01:23 +0000659 frame->sample_rate_hz_ != kSampleRate32kHz &&
660 frame->sample_rate_hz_ != kSampleRate48kHz) {
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000661 return kBadSampleRateError;
662 }
peah192164e2015-11-17 02:16:45 -0800663
peahdf3efa82015-11-28 12:35:15 -0800664 ProcessingConfig processing_config;
665 {
666 // Aquire lock for the access of api_format.
667 // The lock is released immediately due to the conditional
668 // reinitialization.
669 rtc::CritScope cs_capture(&crit_capture_);
670 // TODO(ajm): The input and output rates and channels are currently
671 // constrained to be identical in the int16 interface.
672 processing_config = formats_.api_format;
673 }
Michael Graczyk86c6d332015-07-23 11:41:39 -0700674 processing_config.input_stream().set_sample_rate_hz(frame->sample_rate_hz_);
675 processing_config.input_stream().set_num_channels(frame->num_channels_);
676 processing_config.output_stream().set_sample_rate_hz(frame->sample_rate_hz_);
677 processing_config.output_stream().set_num_channels(frame->num_channels_);
678
peahdf3efa82015-11-28 12:35:15 -0800679 {
680 // Do conditional reinitialization.
681 rtc::CritScope cs_render(&crit_render_);
682 RETURN_ON_ERR(MaybeInitializeCapture(processing_config));
683 }
684 rtc::CritScope cs_capture(&crit_capture_);
peah192164e2015-11-17 02:16:45 -0800685 if (frame->samples_per_channel_ !=
peahdf3efa82015-11-28 12:35:15 -0800686 formats_.api_format.input_stream().num_frames()) {
niklase@google.com470e71d2011-07-07 08:21:25 +0000687 return kBadDataLengthError;
688 }
689
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000690#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700691 if (debug_dump_.debug_file->is_open()) {
peah644fa962016-08-18 06:48:33 -0700692 RETURN_ON_ERR(WriteConfigMessage(false));
693
peahdf3efa82015-11-28 12:35:15 -0800694 debug_dump_.capture.event_msg->set_type(audioproc::Event::STREAM);
695 audioproc::Stream* msg = debug_dump_.capture.event_msg->mutable_stream();
Michael Graczyk86c6d332015-07-23 11:41:39 -0700696 const size_t data_size =
697 sizeof(int16_t) * frame->samples_per_channel_ * frame->num_channels_;
andrew@webrtc.org63a50982012-05-02 23:56:37 +0000698 msg->set_input_data(frame->data_, data_size);
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000699 }
700#endif
701
peahdf3efa82015-11-28 12:35:15 -0800702 capture_.capture_audio->DeinterleaveFrom(frame);
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000703 RETURN_ON_ERR(ProcessStreamLocked());
aluebsdf6416a2016-03-16 18:26:35 -0700704 capture_.capture_audio->InterleaveTo(frame, output_copy_needed());
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000705
706#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700707 if (debug_dump_.debug_file->is_open()) {
peahdf3efa82015-11-28 12:35:15 -0800708 audioproc::Stream* msg = debug_dump_.capture.event_msg->mutable_stream();
Michael Graczyk86c6d332015-07-23 11:41:39 -0700709 const size_t data_size =
710 sizeof(int16_t) * frame->samples_per_channel_ * frame->num_channels_;
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000711 msg->set_output_data(frame->data_, data_size);
peahdf3efa82015-11-28 12:35:15 -0800712 RETURN_ON_ERR(WriteMessageToDebugFile(debug_dump_.debug_file.get(),
ivocd66b44d2016-01-15 03:06:36 -0800713 &debug_dump_.num_bytes_left_for_log_,
peahdf3efa82015-11-28 12:35:15 -0800714 &crit_debug_, &debug_dump_.capture));
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000715 }
716#endif
717
718 return kNoError;
719}
720
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000721int AudioProcessingImpl::ProcessStreamLocked() {
peahb58a1582016-03-15 09:34:24 -0700722 // Ensure that not both the AEC and AECM are active at the same time.
723 // TODO(peah): Simplify once the public API Enable functions for these
724 // are moved to APM.
725 RTC_DCHECK(!(public_submodules_->echo_cancellation->is_enabled() &&
726 public_submodules_->echo_control_mobile->is_enabled()));
727
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000728#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700729 if (debug_dump_.debug_file->is_open()) {
peahdf3efa82015-11-28 12:35:15 -0800730 audioproc::Stream* msg = debug_dump_.capture.event_msg->mutable_stream();
731 msg->set_delay(capture_nonlocked_.stream_delay_ms);
732 msg->set_drift(
733 public_submodules_->echo_cancellation->stream_drift_samples());
bjornv@webrtc.org63da1dd2015-02-06 19:44:21 +0000734 msg->set_level(gain_control()->stream_analog_level());
peahdf3efa82015-11-28 12:35:15 -0800735 msg->set_keypress(capture_.key_pressed);
niklase@google.com470e71d2011-07-07 08:21:25 +0000736 }
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000737#endif
niklase@google.com470e71d2011-07-07 08:21:25 +0000738
Bjorn Volcker1ca324f2015-06-29 14:57:29 +0200739 MaybeUpdateHistograms();
740
peahdf3efa82015-11-28 12:35:15 -0800741 AudioBuffer* ca = capture_.capture_audio.get(); // For brevity.
ekmeyerson60d9b332015-08-14 10:35:55 -0700742
peahbe615622016-02-13 16:40:47 -0800743 if (constants_.use_experimental_agc &&
peahdf3efa82015-11-28 12:35:15 -0800744 public_submodules_->gain_control->is_enabled()) {
745 private_submodules_->agc_manager->AnalyzePreProcess(
746 ca->channels()[0], ca->num_channels(),
747 capture_nonlocked_.fwd_proc_format.num_frames());
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000748 }
749
aluebsdf6416a2016-03-16 18:26:35 -0700750 if (fwd_analysis_needed()) {
aluebs@webrtc.orgbe05c742014-11-14 22:18:10 +0000751 ca->SplitIntoFrequencyBands();
niklase@google.com470e71d2011-07-07 08:21:25 +0000752 }
753
aluebsb2328d12016-01-11 20:32:29 -0800754 if (capture_nonlocked_.beamformer_enabled) {
Alejandro Luebsf4022ff2016-07-01 17:19:09 -0700755 private_submodules_->beamformer->AnalyzeChunk(*ca->split_data_f());
756 // Discards all channels by the leftmost one.
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +0000757 ca->set_num_channels(1);
758 }
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +0000759
solenberg70f99032015-12-08 11:07:32 -0800760 public_submodules_->high_pass_filter->ProcessCaptureAudio(ca);
peahdf3efa82015-11-28 12:35:15 -0800761 RETURN_ON_ERR(public_submodules_->gain_control->AnalyzeCaptureAudio(ca));
solenberg5e465c32015-12-08 13:22:33 -0800762 public_submodules_->noise_suppression->AnalyzeCaptureAudio(ca);
peahb58a1582016-03-15 09:34:24 -0700763
764 // Ensure that the stream delay was set before the call to the
765 // AEC ProcessCaptureAudio function.
766 if (public_submodules_->echo_cancellation->is_enabled() &&
767 !was_stream_delay_set()) {
768 return AudioProcessing::kStreamParameterNotSetError;
769 }
770
771 RETURN_ON_ERR(public_submodules_->echo_cancellation->ProcessCaptureAudio(
772 ca, stream_delay_ms()));
niklase@google.com470e71d2011-07-07 08:21:25 +0000773
peahdf3efa82015-11-28 12:35:15 -0800774 if (public_submodules_->echo_control_mobile->is_enabled() &&
775 public_submodules_->noise_suppression->is_enabled()) {
andrew@webrtc.org103657b2014-04-24 18:28:56 +0000776 ca->CopyLowPassToReference();
niklase@google.com470e71d2011-07-07 08:21:25 +0000777 }
solenberg5e465c32015-12-08 13:22:33 -0800778 public_submodules_->noise_suppression->ProcessCaptureAudio(ca);
peah1bcfce52016-08-26 07:16:04 -0700779#if WEBRTC_INTELLIGIBILITY_ENHANCER
Alejandro Luebsc9b0c262016-05-16 15:32:38 -0700780 if (capture_nonlocked_.intelligibility_enabled) {
aluebsc466bad2016-02-10 12:03:00 -0800781 RTC_DCHECK(public_submodules_->noise_suppression->is_enabled());
Alejandro Luebsc9b0c262016-05-16 15:32:38 -0700782 int gain_db = public_submodules_->gain_control->is_enabled() ?
783 public_submodules_->gain_control->compression_gain_db() :
784 0;
Alejandro Luebs50411102016-06-30 15:35:41 -0700785 float gain = std::pow(10.f, gain_db / 20.f);
786 gain *= capture_nonlocked_.level_controller_enabled ?
787 private_submodules_->level_controller->GetLastGain() :
788 1.f;
aluebsc466bad2016-02-10 12:03:00 -0800789 public_submodules_->intelligibility_enhancer->SetCaptureNoiseEstimate(
Alejandro Luebs50411102016-06-30 15:35:41 -0700790 public_submodules_->noise_suppression->NoiseEstimate(), gain);
aluebsc466bad2016-02-10 12:03:00 -0800791 }
peah1bcfce52016-08-26 07:16:04 -0700792#endif
peah253534d2016-03-15 04:32:28 -0700793
794 // Ensure that the stream delay was set before the call to the
795 // AECM ProcessCaptureAudio function.
796 if (public_submodules_->echo_control_mobile->is_enabled() &&
797 !was_stream_delay_set()) {
798 return AudioProcessing::kStreamParameterNotSetError;
799 }
800
801 RETURN_ON_ERR(public_submodules_->echo_control_mobile->ProcessCaptureAudio(
802 ca, stream_delay_ms()));
803
Alejandro Luebsf4022ff2016-07-01 17:19:09 -0700804 if (capture_nonlocked_.beamformer_enabled) {
805 private_submodules_->beamformer->PostFilter(ca->split_data_f());
806 }
807
solenberga29386c2015-12-16 03:31:12 -0800808 public_submodules_->voice_detection->ProcessCaptureAudio(ca);
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000809
peahbe615622016-02-13 16:40:47 -0800810 if (constants_.use_experimental_agc &&
peahdf3efa82015-11-28 12:35:15 -0800811 public_submodules_->gain_control->is_enabled() &&
aluebsb2328d12016-01-11 20:32:29 -0800812 (!capture_nonlocked_.beamformer_enabled ||
peahdf3efa82015-11-28 12:35:15 -0800813 private_submodules_->beamformer->is_target_present())) {
814 private_submodules_->agc_manager->Process(
815 ca->split_bands_const(0)[kBand0To8kHz], ca->num_frames_per_band(),
816 capture_nonlocked_.split_rate);
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000817 }
peahb8fbb542016-03-15 02:28:08 -0700818 RETURN_ON_ERR(public_submodules_->gain_control->ProcessCaptureAudio(
819 ca, echo_cancellation()->stream_has_echo()));
niklase@google.com470e71d2011-07-07 08:21:25 +0000820
aluebsdf6416a2016-03-16 18:26:35 -0700821 if (fwd_synthesis_needed()) {
aluebs@webrtc.orgbe05c742014-11-14 22:18:10 +0000822 ca->MergeFrequencyBands();
niklase@google.com470e71d2011-07-07 08:21:25 +0000823 }
824
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000825 // TODO(aluebs): Investigate if the transient suppression placement should be
826 // before or after the AGC.
peahdf3efa82015-11-28 12:35:15 -0800827 if (capture_.transient_suppressor_enabled) {
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000828 float voice_probability =
peahdf3efa82015-11-28 12:35:15 -0800829 private_submodules_->agc_manager.get()
830 ? private_submodules_->agc_manager->voice_probability()
831 : 1.f;
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000832
peahdf3efa82015-11-28 12:35:15 -0800833 public_submodules_->transient_suppressor->Suppress(
Michael Graczyk86c6d332015-07-23 11:41:39 -0700834 ca->channels_f()[0], ca->num_frames(), ca->num_channels(),
835 ca->split_bands_const_f(0)[kBand0To8kHz], ca->num_frames_per_band(),
836 ca->keyboard_data(), ca->num_keyboard_frames(), voice_probability,
peahdf3efa82015-11-28 12:35:15 -0800837 capture_.key_pressed);
pbos@webrtc.org788acd12014-12-15 09:41:24 +0000838 }
839
peahca4cac72016-06-29 15:26:12 -0700840 if (capture_nonlocked_.level_controller_enabled) {
841 private_submodules_->level_controller->Process(ca);
842 }
843
andrew@webrtc.org755b04a2011-11-15 16:57:56 +0000844 // The level estimator operates on the recombined data.
solenberg949028f2015-12-15 11:39:38 -0800845 public_submodules_->level_estimator->ProcessStream(ca);
ajm@google.com808e0e02011-08-03 21:08:51 +0000846
peahdf3efa82015-11-28 12:35:15 -0800847 capture_.was_stream_delay_set = false;
niklase@google.com470e71d2011-07-07 08:21:25 +0000848 return kNoError;
849}
850
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000851int AudioProcessingImpl::AnalyzeReverseStream(const float* const* data,
Peter Kastingdce40cf2015-08-24 14:52:23 -0700852 size_t samples_per_channel,
ekmeyerson60d9b332015-08-14 10:35:55 -0700853 int rev_sample_rate_hz,
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000854 ChannelLayout layout) {
peah369f8282015-12-17 06:42:29 -0800855 TRACE_EVENT0("webrtc", "AudioProcessing::AnalyzeReverseStream_ChannelLayout");
peahdf3efa82015-11-28 12:35:15 -0800856 rtc::CritScope cs(&crit_render_);
Michael Graczyk86c6d332015-07-23 11:41:39 -0700857 const StreamConfig reverse_config = {
ekmeyerson60d9b332015-08-14 10:35:55 -0700858 rev_sample_rate_hz, ChannelsFromLayout(layout), LayoutHasKeyboard(layout),
Michael Graczyk86c6d332015-07-23 11:41:39 -0700859 };
860 if (samples_per_channel != reverse_config.num_frames()) {
861 return kBadDataLengthError;
862 }
peahdf3efa82015-11-28 12:35:15 -0800863 return AnalyzeReverseStreamLocked(data, reverse_config, reverse_config);
ekmeyerson60d9b332015-08-14 10:35:55 -0700864}
865
866int AudioProcessingImpl::ProcessReverseStream(
867 const float* const* src,
868 const StreamConfig& reverse_input_config,
869 const StreamConfig& reverse_output_config,
870 float* const* dest) {
peah369f8282015-12-17 06:42:29 -0800871 TRACE_EVENT0("webrtc", "AudioProcessing::ProcessReverseStream_StreamConfig");
peahdf3efa82015-11-28 12:35:15 -0800872 rtc::CritScope cs(&crit_render_);
873 RETURN_ON_ERR(AnalyzeReverseStreamLocked(src, reverse_input_config,
874 reverse_output_config));
ekmeyerson60d9b332015-08-14 10:35:55 -0700875 if (is_rev_processed()) {
peahdf3efa82015-11-28 12:35:15 -0800876 render_.render_audio->CopyTo(formats_.api_format.reverse_output_stream(),
877 dest);
peah81b9bfe2015-11-27 02:47:28 -0800878 } else if (render_check_rev_conversion_needed()) {
peahdf3efa82015-11-28 12:35:15 -0800879 render_.render_converter->Convert(src, reverse_input_config.num_samples(),
880 dest,
881 reverse_output_config.num_samples());
ekmeyerson60d9b332015-08-14 10:35:55 -0700882 } else {
883 CopyAudioIfNeeded(src, reverse_input_config.num_frames(),
884 reverse_input_config.num_channels(), dest);
885 }
886
887 return kNoError;
Michael Graczyk86c6d332015-07-23 11:41:39 -0700888}
889
peahdf3efa82015-11-28 12:35:15 -0800890int AudioProcessingImpl::AnalyzeReverseStreamLocked(
ekmeyerson60d9b332015-08-14 10:35:55 -0700891 const float* const* src,
892 const StreamConfig& reverse_input_config,
893 const StreamConfig& reverse_output_config) {
peahdf3efa82015-11-28 12:35:15 -0800894 if (src == nullptr) {
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000895 return kNullPointerError;
896 }
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000897
Peter Kasting69558702016-01-12 16:26:35 -0800898 if (reverse_input_config.num_channels() == 0) {
Michael Graczyk86c6d332015-07-23 11:41:39 -0700899 return kBadNumberChannelsError;
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000900 }
901
peahdf3efa82015-11-28 12:35:15 -0800902 ProcessingConfig processing_config = formats_.api_format;
ekmeyerson60d9b332015-08-14 10:35:55 -0700903 processing_config.reverse_input_stream() = reverse_input_config;
904 processing_config.reverse_output_stream() = reverse_output_config;
Michael Graczyk86c6d332015-07-23 11:41:39 -0700905
peahdf3efa82015-11-28 12:35:15 -0800906 RETURN_ON_ERR(MaybeInitializeRender(processing_config));
ekmeyerson60d9b332015-08-14 10:35:55 -0700907 assert(reverse_input_config.num_frames() ==
peahdf3efa82015-11-28 12:35:15 -0800908 formats_.api_format.reverse_input_stream().num_frames());
Michael Graczyk86c6d332015-07-23 11:41:39 -0700909
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000910#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700911 if (debug_dump_.debug_file->is_open()) {
peahdf3efa82015-11-28 12:35:15 -0800912 debug_dump_.render.event_msg->set_type(audioproc::Event::REVERSE_STREAM);
913 audioproc::ReverseStream* msg =
914 debug_dump_.render.event_msg->mutable_reverse_stream();
aluebs@webrtc.org59a1b1b2014-08-28 10:43:09 +0000915 const size_t channel_size =
peahdf3efa82015-11-28 12:35:15 -0800916 sizeof(float) * formats_.api_format.reverse_input_stream().num_frames();
Peter Kasting69558702016-01-12 16:26:35 -0800917 for (size_t i = 0;
peahdf3efa82015-11-28 12:35:15 -0800918 i < formats_.api_format.reverse_input_stream().num_channels(); ++i)
ekmeyerson60d9b332015-08-14 10:35:55 -0700919 msg->add_channel(src[i], channel_size);
peahdf3efa82015-11-28 12:35:15 -0800920 RETURN_ON_ERR(WriteMessageToDebugFile(debug_dump_.debug_file.get(),
ivocd66b44d2016-01-15 03:06:36 -0800921 &debug_dump_.num_bytes_left_for_log_,
peahdf3efa82015-11-28 12:35:15 -0800922 &crit_debug_, &debug_dump_.render));
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000923 }
924#endif
925
peahdf3efa82015-11-28 12:35:15 -0800926 render_.render_audio->CopyFrom(src,
927 formats_.api_format.reverse_input_stream());
ekmeyerson60d9b332015-08-14 10:35:55 -0700928 return ProcessReverseStreamLocked();
929}
930
931int AudioProcessingImpl::ProcessReverseStream(AudioFrame* frame) {
peah369f8282015-12-17 06:42:29 -0800932 TRACE_EVENT0("webrtc", "AudioProcessing::ProcessReverseStream_AudioFrame");
peahdf3efa82015-11-28 12:35:15 -0800933 rtc::CritScope cs(&crit_render_);
peahdf3efa82015-11-28 12:35:15 -0800934 if (frame == nullptr) {
niklase@google.com470e71d2011-07-07 08:21:25 +0000935 return kNullPointerError;
936 }
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000937 // Must be a native rate.
938 if (frame->sample_rate_hz_ != kSampleRate8kHz &&
939 frame->sample_rate_hz_ != kSampleRate16kHz &&
aluebs@webrtc.org087da132014-11-17 23:01:23 +0000940 frame->sample_rate_hz_ != kSampleRate32kHz &&
941 frame->sample_rate_hz_ != kSampleRate48kHz) {
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +0000942 return kBadSampleRateError;
943 }
andrew@webrtc.orga8b97372014-03-10 22:26:12 +0000944
Michael Graczyk86c6d332015-07-23 11:41:39 -0700945 if (frame->num_channels_ <= 0) {
946 return kBadNumberChannelsError;
947 }
948
peahdf3efa82015-11-28 12:35:15 -0800949 ProcessingConfig processing_config = formats_.api_format;
ekmeyerson60d9b332015-08-14 10:35:55 -0700950 processing_config.reverse_input_stream().set_sample_rate_hz(
951 frame->sample_rate_hz_);
952 processing_config.reverse_input_stream().set_num_channels(
953 frame->num_channels_);
954 processing_config.reverse_output_stream().set_sample_rate_hz(
955 frame->sample_rate_hz_);
956 processing_config.reverse_output_stream().set_num_channels(
957 frame->num_channels_);
Michael Graczyk86c6d332015-07-23 11:41:39 -0700958
peahdf3efa82015-11-28 12:35:15 -0800959 RETURN_ON_ERR(MaybeInitializeRender(processing_config));
Michael Graczyk86c6d332015-07-23 11:41:39 -0700960 if (frame->samples_per_channel_ !=
peahdf3efa82015-11-28 12:35:15 -0800961 formats_.api_format.reverse_input_stream().num_frames()) {
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000962 return kBadDataLengthError;
963 }
niklase@google.com470e71d2011-07-07 08:21:25 +0000964
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000965#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
tommia6219cc2016-06-15 10:30:14 -0700966 if (debug_dump_.debug_file->is_open()) {
peahdf3efa82015-11-28 12:35:15 -0800967 debug_dump_.render.event_msg->set_type(audioproc::Event::REVERSE_STREAM);
968 audioproc::ReverseStream* msg =
969 debug_dump_.render.event_msg->mutable_reverse_stream();
Michael Graczyk86c6d332015-07-23 11:41:39 -0700970 const size_t data_size =
971 sizeof(int16_t) * frame->samples_per_channel_ * frame->num_channels_;
andrew@webrtc.org63a50982012-05-02 23:56:37 +0000972 msg->set_data(frame->data_, data_size);
peahdf3efa82015-11-28 12:35:15 -0800973 RETURN_ON_ERR(WriteMessageToDebugFile(debug_dump_.debug_file.get(),
ivocd66b44d2016-01-15 03:06:36 -0800974 &debug_dump_.num_bytes_left_for_log_,
peahdf3efa82015-11-28 12:35:15 -0800975 &crit_debug_, &debug_dump_.render));
niklase@google.com470e71d2011-07-07 08:21:25 +0000976 }
andrew@webrtc.org7bf26462011-12-03 00:03:31 +0000977#endif
peahdf3efa82015-11-28 12:35:15 -0800978 render_.render_audio->DeinterleaveFrom(frame);
aluebsb0319552016-03-17 20:39:53 -0700979 RETURN_ON_ERR(ProcessReverseStreamLocked());
980 if (is_rev_processed()) {
981 render_.render_audio->InterleaveTo(frame, true);
982 }
983 return kNoError;
andrew@webrtc.org17e40642014-03-04 20:58:13 +0000984}
niklase@google.com470e71d2011-07-07 08:21:25 +0000985
ekmeyerson60d9b332015-08-14 10:35:55 -0700986int AudioProcessingImpl::ProcessReverseStreamLocked() {
peahdf3efa82015-11-28 12:35:15 -0800987 AudioBuffer* ra = render_.render_audio.get(); // For brevity.
aluebsdf6416a2016-03-16 18:26:35 -0700988 if (rev_analysis_needed()) {
aluebs@webrtc.orgbe05c742014-11-14 22:18:10 +0000989 ra->SplitIntoFrequencyBands();
niklase@google.com470e71d2011-07-07 08:21:25 +0000990 }
991
peah1bcfce52016-08-26 07:16:04 -0700992#if WEBRTC_INTELLIGIBILITY_ENHANCER
Alejandro Luebsc9b0c262016-05-16 15:32:38 -0700993 if (capture_nonlocked_.intelligibility_enabled) {
peahdf3efa82015-11-28 12:35:15 -0800994 public_submodules_->intelligibility_enhancer->ProcessRenderAudio(
995 ra->split_channels_f(kBand0To8kHz), capture_nonlocked_.split_rate,
996 ra->num_channels());
ekmeyerson60d9b332015-08-14 10:35:55 -0700997 }
peah1bcfce52016-08-26 07:16:04 -0700998#endif
ekmeyerson60d9b332015-08-14 10:35:55 -0700999
peahdf3efa82015-11-28 12:35:15 -08001000 RETURN_ON_ERR(public_submodules_->echo_cancellation->ProcessRenderAudio(ra));
1001 RETURN_ON_ERR(
1002 public_submodules_->echo_control_mobile->ProcessRenderAudio(ra));
peahbe615622016-02-13 16:40:47 -08001003 if (!constants_.use_experimental_agc) {
peahdf3efa82015-11-28 12:35:15 -08001004 RETURN_ON_ERR(public_submodules_->gain_control->ProcessRenderAudio(ra));
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001005 }
niklase@google.com470e71d2011-07-07 08:21:25 +00001006
aluebsdf6416a2016-03-16 18:26:35 -07001007 if (rev_synthesis_needed()) {
ekmeyerson60d9b332015-08-14 10:35:55 -07001008 ra->MergeFrequencyBands();
1009 }
1010
andrew@webrtc.org17e40642014-03-04 20:58:13 +00001011 return kNoError;
niklase@google.com470e71d2011-07-07 08:21:25 +00001012}
1013
1014int AudioProcessingImpl::set_stream_delay_ms(int delay) {
peahdf3efa82015-11-28 12:35:15 -08001015 rtc::CritScope cs(&crit_capture_);
andrew@webrtc.org5f23d642012-05-29 21:14:06 +00001016 Error retval = kNoError;
peahdf3efa82015-11-28 12:35:15 -08001017 capture_.was_stream_delay_set = true;
1018 delay += capture_.delay_offset_ms;
andrew@webrtc.org6f9f8172012-03-06 19:03:39 +00001019
niklase@google.com470e71d2011-07-07 08:21:25 +00001020 if (delay < 0) {
andrew@webrtc.org5f23d642012-05-29 21:14:06 +00001021 delay = 0;
1022 retval = kBadStreamParameterWarning;
niklase@google.com470e71d2011-07-07 08:21:25 +00001023 }
1024
1025 // TODO(ajm): the max is rather arbitrarily chosen; investigate.
1026 if (delay > 500) {
andrew@webrtc.org5f23d642012-05-29 21:14:06 +00001027 delay = 500;
1028 retval = kBadStreamParameterWarning;
niklase@google.com470e71d2011-07-07 08:21:25 +00001029 }
1030
peahdf3efa82015-11-28 12:35:15 -08001031 capture_nonlocked_.stream_delay_ms = delay;
andrew@webrtc.org5f23d642012-05-29 21:14:06 +00001032 return retval;
niklase@google.com470e71d2011-07-07 08:21:25 +00001033}
1034
1035int AudioProcessingImpl::stream_delay_ms() const {
peahdf3efa82015-11-28 12:35:15 -08001036 // Used as callback from submodules, hence locking is not allowed.
1037 return capture_nonlocked_.stream_delay_ms;
niklase@google.com470e71d2011-07-07 08:21:25 +00001038}
1039
1040bool AudioProcessingImpl::was_stream_delay_set() const {
peahdf3efa82015-11-28 12:35:15 -08001041 // Used as callback from submodules, hence locking is not allowed.
1042 return capture_.was_stream_delay_set;
niklase@google.com470e71d2011-07-07 08:21:25 +00001043}
1044
andrew@webrtc.org17e40642014-03-04 20:58:13 +00001045void AudioProcessingImpl::set_stream_key_pressed(bool key_pressed) {
peahdf3efa82015-11-28 12:35:15 -08001046 rtc::CritScope cs(&crit_capture_);
1047 capture_.key_pressed = key_pressed;
andrew@webrtc.org17e40642014-03-04 20:58:13 +00001048}
1049
andrew@webrtc.org6f9f8172012-03-06 19:03:39 +00001050void AudioProcessingImpl::set_delay_offset_ms(int offset) {
peahdf3efa82015-11-28 12:35:15 -08001051 rtc::CritScope cs(&crit_capture_);
1052 capture_.delay_offset_ms = offset;
andrew@webrtc.org6f9f8172012-03-06 19:03:39 +00001053}
1054
1055int AudioProcessingImpl::delay_offset_ms() const {
peahdf3efa82015-11-28 12:35:15 -08001056 rtc::CritScope cs(&crit_capture_);
1057 return capture_.delay_offset_ms;
andrew@webrtc.org6f9f8172012-03-06 19:03:39 +00001058}
1059
niklase@google.com470e71d2011-07-07 08:21:25 +00001060int AudioProcessingImpl::StartDebugRecording(
ivocd66b44d2016-01-15 03:06:36 -08001061 const char filename[AudioProcessing::kMaxFilenameSize],
1062 int64_t max_log_size_bytes) {
peahdf3efa82015-11-28 12:35:15 -08001063 // Run in a single-threaded manner.
1064 rtc::CritScope cs_render(&crit_render_);
1065 rtc::CritScope cs_capture(&crit_capture_);
André Susano Pinto664cdaf2015-05-20 11:11:07 +02001066 static_assert(kMaxFilenameSize == FileWrapper::kMaxFileNameSize, "");
niklase@google.com470e71d2011-07-07 08:21:25 +00001067
peahdf3efa82015-11-28 12:35:15 -08001068 if (filename == nullptr) {
niklase@google.com470e71d2011-07-07 08:21:25 +00001069 return kNullPointerError;
1070 }
1071
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001072#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
ivocd66b44d2016-01-15 03:06:36 -08001073 debug_dump_.num_bytes_left_for_log_ = max_log_size_bytes;
niklase@google.com470e71d2011-07-07 08:21:25 +00001074 // Stop any ongoing recording.
tommia6219cc2016-06-15 10:30:14 -07001075 debug_dump_.debug_file->CloseFile();
niklase@google.com470e71d2011-07-07 08:21:25 +00001076
tommia6219cc2016-06-15 10:30:14 -07001077 if (!debug_dump_.debug_file->OpenFile(filename, false)) {
niklase@google.com470e71d2011-07-07 08:21:25 +00001078 return kFileError;
1079 }
1080
Minyue13b96ba2015-10-03 00:39:14 +02001081 RETURN_ON_ERR(WriteConfigMessage(true));
1082 RETURN_ON_ERR(WriteInitMessage());
niklase@google.com470e71d2011-07-07 08:21:25 +00001083 return kNoError;
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001084#else
1085 return kUnsupportedFunctionError;
1086#endif // WEBRTC_AUDIOPROC_DEBUG_DUMP
niklase@google.com470e71d2011-07-07 08:21:25 +00001087}
1088
ivocd66b44d2016-01-15 03:06:36 -08001089int AudioProcessingImpl::StartDebugRecording(FILE* handle,
1090 int64_t max_log_size_bytes) {
peahdf3efa82015-11-28 12:35:15 -08001091 // Run in a single-threaded manner.
1092 rtc::CritScope cs_render(&crit_render_);
1093 rtc::CritScope cs_capture(&crit_capture_);
henrikg@webrtc.org863b5362013-12-06 16:05:17 +00001094
peahdf3efa82015-11-28 12:35:15 -08001095 if (handle == nullptr) {
henrikg@webrtc.org863b5362013-12-06 16:05:17 +00001096 return kNullPointerError;
1097 }
1098
1099#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
ivocd66b44d2016-01-15 03:06:36 -08001100 debug_dump_.num_bytes_left_for_log_ = max_log_size_bytes;
1101
henrikg@webrtc.org863b5362013-12-06 16:05:17 +00001102 // Stop any ongoing recording.
tommia6219cc2016-06-15 10:30:14 -07001103 debug_dump_.debug_file->CloseFile();
henrikg@webrtc.org863b5362013-12-06 16:05:17 +00001104
tommia6219cc2016-06-15 10:30:14 -07001105 if (!debug_dump_.debug_file->OpenFromFileHandle(handle)) {
henrikg@webrtc.org863b5362013-12-06 16:05:17 +00001106 return kFileError;
1107 }
1108
Minyue13b96ba2015-10-03 00:39:14 +02001109 RETURN_ON_ERR(WriteConfigMessage(true));
1110 RETURN_ON_ERR(WriteInitMessage());
henrikg@webrtc.org863b5362013-12-06 16:05:17 +00001111 return kNoError;
1112#else
1113 return kUnsupportedFunctionError;
1114#endif // WEBRTC_AUDIOPROC_DEBUG_DUMP
1115}
1116
xians@webrtc.orge46bc772014-10-10 08:36:56 +00001117int AudioProcessingImpl::StartDebugRecordingForPlatformFile(
1118 rtc::PlatformFile handle) {
peahdf3efa82015-11-28 12:35:15 -08001119 // Run in a single-threaded manner.
1120 rtc::CritScope cs_render(&crit_render_);
1121 rtc::CritScope cs_capture(&crit_capture_);
xians@webrtc.orge46bc772014-10-10 08:36:56 +00001122 FILE* stream = rtc::FdopenPlatformFileForWriting(handle);
ivocd66b44d2016-01-15 03:06:36 -08001123 return StartDebugRecording(stream, -1);
xians@webrtc.orge46bc772014-10-10 08:36:56 +00001124}
1125
niklase@google.com470e71d2011-07-07 08:21:25 +00001126int AudioProcessingImpl::StopDebugRecording() {
peahdf3efa82015-11-28 12:35:15 -08001127 // Run in a single-threaded manner.
1128 rtc::CritScope cs_render(&crit_render_);
1129 rtc::CritScope cs_capture(&crit_capture_);
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001130
1131#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
niklase@google.com470e71d2011-07-07 08:21:25 +00001132 // We just return if recording hasn't started.
tommia6219cc2016-06-15 10:30:14 -07001133 debug_dump_.debug_file->CloseFile();
niklase@google.com470e71d2011-07-07 08:21:25 +00001134 return kNoError;
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001135#else
1136 return kUnsupportedFunctionError;
1137#endif // WEBRTC_AUDIOPROC_DEBUG_DUMP
niklase@google.com470e71d2011-07-07 08:21:25 +00001138}
1139
1140EchoCancellation* AudioProcessingImpl::echo_cancellation() const {
peahdf3efa82015-11-28 12:35:15 -08001141 // Adding a lock here has no effect as it allows any access to the submodule
1142 // from the returned pointer.
peahb624d8c2016-03-05 03:01:14 -08001143 return public_submodules_->echo_cancellation.get();
niklase@google.com470e71d2011-07-07 08:21:25 +00001144}
1145
1146EchoControlMobile* AudioProcessingImpl::echo_control_mobile() const {
peahdf3efa82015-11-28 12:35:15 -08001147 // Adding a lock here has no effect as it allows any access to the submodule
1148 // from the returned pointer.
peahbb9edbd2016-03-10 12:54:25 -08001149 return public_submodules_->echo_control_mobile.get();
niklase@google.com470e71d2011-07-07 08:21:25 +00001150}
1151
1152GainControl* AudioProcessingImpl::gain_control() const {
peahdf3efa82015-11-28 12:35:15 -08001153 // Adding a lock here has no effect as it allows any access to the submodule
1154 // from the returned pointer.
peahbe615622016-02-13 16:40:47 -08001155 if (constants_.use_experimental_agc) {
1156 return public_submodules_->gain_control_for_experimental_agc.get();
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001157 }
peahbfa97112016-03-10 21:09:04 -08001158 return public_submodules_->gain_control.get();
niklase@google.com470e71d2011-07-07 08:21:25 +00001159}
1160
1161HighPassFilter* AudioProcessingImpl::high_pass_filter() const {
peahdf3efa82015-11-28 12:35:15 -08001162 // Adding a lock here has no effect as it allows any access to the submodule
1163 // from the returned pointer.
solenberg70f99032015-12-08 11:07:32 -08001164 return public_submodules_->high_pass_filter.get();
niklase@google.com470e71d2011-07-07 08:21:25 +00001165}
1166
1167LevelEstimator* AudioProcessingImpl::level_estimator() const {
peahdf3efa82015-11-28 12:35:15 -08001168 // Adding a lock here has no effect as it allows any access to the submodule
1169 // from the returned pointer.
solenberg949028f2015-12-15 11:39:38 -08001170 return public_submodules_->level_estimator.get();
niklase@google.com470e71d2011-07-07 08:21:25 +00001171}
1172
1173NoiseSuppression* AudioProcessingImpl::noise_suppression() const {
peahdf3efa82015-11-28 12:35:15 -08001174 // Adding a lock here has no effect as it allows any access to the submodule
1175 // from the returned pointer.
solenberg5e465c32015-12-08 13:22:33 -08001176 return public_submodules_->noise_suppression.get();
niklase@google.com470e71d2011-07-07 08:21:25 +00001177}
1178
1179VoiceDetection* AudioProcessingImpl::voice_detection() const {
peahdf3efa82015-11-28 12:35:15 -08001180 // Adding a lock here has no effect as it allows any access to the submodule
1181 // from the returned pointer.
solenberga29386c2015-12-16 03:31:12 -08001182 return public_submodules_->voice_detection.get();
niklase@google.com470e71d2011-07-07 08:21:25 +00001183}
1184
Alejandro Luebs63a2c132016-03-31 18:04:40 -07001185bool AudioProcessingImpl::is_fwd_processed() const {
peah253d8fa2016-02-22 02:00:09 -08001186 // The beamformer, noise suppressor and highpass filter
1187 // modify the data.
1188 if (capture_nonlocked_.beamformer_enabled ||
1189 public_submodules_->high_pass_filter->is_enabled() ||
peahb624d8c2016-03-05 03:01:14 -08001190 public_submodules_->noise_suppression->is_enabled() ||
peahbb9edbd2016-03-10 12:54:25 -08001191 public_submodules_->echo_cancellation->is_enabled() ||
peahbfa97112016-03-10 21:09:04 -08001192 public_submodules_->echo_control_mobile->is_enabled() ||
1193 public_submodules_->gain_control->is_enabled()) {
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +00001194 return true;
1195 }
1196
peah253d8fa2016-02-22 02:00:09 -08001197 // The capture data is otherwise unchanged.
1198 return false;
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001199}
1200
aluebsdf6416a2016-03-16 18:26:35 -07001201bool AudioProcessingImpl::output_copy_needed() const {
andrew@webrtc.org369166a2012-04-24 18:38:03 +00001202 // Check if we've upmixed or downmixed the audio.
peahdf3efa82015-11-28 12:35:15 -08001203 return ((formats_.api_format.output_stream().num_channels() !=
1204 formats_.api_format.input_stream().num_channels()) ||
peahca4cac72016-06-29 15:26:12 -07001205 is_fwd_processed() || capture_.transient_suppressor_enabled ||
1206 capture_nonlocked_.level_controller_enabled);
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001207}
1208
aluebsdf6416a2016-03-16 18:26:35 -07001209bool AudioProcessingImpl::fwd_synthesis_needed() const {
Alejandro Luebs63a2c132016-03-31 18:04:40 -07001210 return (is_fwd_processed() &&
aluebsdf6416a2016-03-16 18:26:35 -07001211 is_multi_band(capture_nonlocked_.fwd_proc_format.sample_rate_hz()));
andrew@webrtc.org369166a2012-04-24 18:38:03 +00001212}
1213
aluebsdf6416a2016-03-16 18:26:35 -07001214bool AudioProcessingImpl::fwd_analysis_needed() const {
Alejandro Luebs63a2c132016-03-31 18:04:40 -07001215 if (!is_fwd_processed() &&
peahdf3efa82015-11-28 12:35:15 -08001216 !public_submodules_->voice_detection->is_enabled() &&
1217 !capture_.transient_suppressor_enabled) {
1218 // Only public_submodules_->level_estimator is enabled.
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001219 return false;
aluebsdf6416a2016-03-16 18:26:35 -07001220 } else if (is_multi_band(
1221 capture_nonlocked_.fwd_proc_format.sample_rate_hz())) {
peahdf3efa82015-11-28 12:35:15 -08001222 // Something besides public_submodules_->level_estimator is enabled, and we
1223 // have super-wb.
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001224 return true;
1225 }
1226 return false;
1227}
1228
ekmeyerson60d9b332015-08-14 10:35:55 -07001229bool AudioProcessingImpl::is_rev_processed() const {
peah1bcfce52016-08-26 07:16:04 -07001230#if WEBRTC_INTELLIGIBILITY_ENHANCER
Alejandro Luebsc9b0c262016-05-16 15:32:38 -07001231 return capture_nonlocked_.intelligibility_enabled;
peah1bcfce52016-08-26 07:16:04 -07001232#else
1233 return false;
1234#endif
ekmeyerson60d9b332015-08-14 10:35:55 -07001235}
1236
aluebsdf6416a2016-03-16 18:26:35 -07001237bool AudioProcessingImpl::rev_synthesis_needed() const {
1238 return (is_rev_processed() &&
aluebseb3603b2016-04-20 15:27:58 -07001239 is_multi_band(formats_.rev_proc_format.sample_rate_hz()));
aluebsdf6416a2016-03-16 18:26:35 -07001240}
1241
1242bool AudioProcessingImpl::rev_analysis_needed() const {
aluebseb3603b2016-04-20 15:27:58 -07001243 return is_multi_band(formats_.rev_proc_format.sample_rate_hz()) &&
Alejandro Luebs63a2c132016-03-31 18:04:40 -07001244 (is_rev_processed() ||
peahdc2242d2016-04-06 09:30:58 -07001245 public_submodules_->echo_cancellation
1246 ->is_enabled_render_side_query() ||
1247 public_submodules_->echo_control_mobile
1248 ->is_enabled_render_side_query() ||
1249 public_submodules_->gain_control->is_enabled_render_side_query());
aluebsdf6416a2016-03-16 18:26:35 -07001250}
1251
peah81b9bfe2015-11-27 02:47:28 -08001252bool AudioProcessingImpl::render_check_rev_conversion_needed() const {
1253 return rev_conversion_needed();
1254}
1255
ekmeyerson60d9b332015-08-14 10:35:55 -07001256bool AudioProcessingImpl::rev_conversion_needed() const {
peahdf3efa82015-11-28 12:35:15 -08001257 return (formats_.api_format.reverse_input_stream() !=
1258 formats_.api_format.reverse_output_stream());
ekmeyerson60d9b332015-08-14 10:35:55 -07001259}
1260
Bjorn Volckeradc46c42015-04-15 11:42:40 +02001261void AudioProcessingImpl::InitializeExperimentalAgc() {
peahbe615622016-02-13 16:40:47 -08001262 if (constants_.use_experimental_agc) {
peahdf3efa82015-11-28 12:35:15 -08001263 if (!private_submodules_->agc_manager.get()) {
1264 private_submodules_->agc_manager.reset(new AgcManagerDirect(
peahbfa97112016-03-10 21:09:04 -08001265 public_submodules_->gain_control.get(),
peahbe615622016-02-13 16:40:47 -08001266 public_submodules_->gain_control_for_experimental_agc.get(),
peahdf3efa82015-11-28 12:35:15 -08001267 constants_.agc_startup_min_volume));
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001268 }
peahdf3efa82015-11-28 12:35:15 -08001269 private_submodules_->agc_manager->Initialize();
1270 private_submodules_->agc_manager->SetCaptureMuted(
1271 capture_.output_will_be_muted);
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001272 }
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001273}
1274
Bjorn Volckeradc46c42015-04-15 11:42:40 +02001275void AudioProcessingImpl::InitializeTransient() {
peahdf3efa82015-11-28 12:35:15 -08001276 if (capture_.transient_suppressor_enabled) {
1277 if (!public_submodules_->transient_suppressor.get()) {
1278 public_submodules_->transient_suppressor.reset(new TransientSuppressor());
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001279 }
peahdf3efa82015-11-28 12:35:15 -08001280 public_submodules_->transient_suppressor->Initialize(
1281 capture_nonlocked_.fwd_proc_format.sample_rate_hz(),
1282 capture_nonlocked_.split_rate,
aluebsb2328d12016-01-11 20:32:29 -08001283 num_proc_channels());
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001284 }
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001285}
1286
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +00001287void AudioProcessingImpl::InitializeBeamformer() {
aluebsb2328d12016-01-11 20:32:29 -08001288 if (capture_nonlocked_.beamformer_enabled) {
peahdf3efa82015-11-28 12:35:15 -08001289 if (!private_submodules_->beamformer) {
1290 private_submodules_->beamformer.reset(new NonlinearBeamformer(
Alejandro Luebsf4022ff2016-07-01 17:19:09 -07001291 capture_.array_geometry, 1u, capture_.target_direction));
aluebs@webrtc.orgd82f55d2015-01-15 18:07:21 +00001292 }
peahdf3efa82015-11-28 12:35:15 -08001293 private_submodules_->beamformer->Initialize(kChunkSizeMs,
1294 capture_nonlocked_.split_rate);
aluebs@webrtc.orgae643ce2014-12-19 19:57:34 +00001295 }
1296}
1297
ekmeyerson60d9b332015-08-14 10:35:55 -07001298void AudioProcessingImpl::InitializeIntelligibility() {
peah1bcfce52016-08-26 07:16:04 -07001299#if WEBRTC_INTELLIGIBILITY_ENHANCER
Alejandro Luebsc9b0c262016-05-16 15:32:38 -07001300 if (capture_nonlocked_.intelligibility_enabled) {
peahdf3efa82015-11-28 12:35:15 -08001301 public_submodules_->intelligibility_enhancer.reset(
Alejandro Luebs18fcbcf2016-02-22 15:57:38 -08001302 new IntelligibilityEnhancer(capture_nonlocked_.split_rate,
Alex Luebs57ae8292016-03-09 16:24:34 +01001303 render_.render_audio->num_channels(),
1304 NoiseSuppressionImpl::num_noise_bins()));
ekmeyerson60d9b332015-08-14 10:35:55 -07001305 }
peah1bcfce52016-08-26 07:16:04 -07001306#endif
ekmeyerson60d9b332015-08-14 10:35:55 -07001307}
1308
solenberg70f99032015-12-08 11:07:32 -08001309void AudioProcessingImpl::InitializeHighPassFilter() {
aluebsb2328d12016-01-11 20:32:29 -08001310 public_submodules_->high_pass_filter->Initialize(num_proc_channels(),
solenberg70f99032015-12-08 11:07:32 -08001311 proc_sample_rate_hz());
1312}
1313
solenberg5e465c32015-12-08 13:22:33 -08001314void AudioProcessingImpl::InitializeNoiseSuppression() {
aluebsb2328d12016-01-11 20:32:29 -08001315 public_submodules_->noise_suppression->Initialize(num_proc_channels(),
solenberg5e465c32015-12-08 13:22:33 -08001316 proc_sample_rate_hz());
1317}
1318
peahb624d8c2016-03-05 03:01:14 -08001319void AudioProcessingImpl::InitializeEchoCanceller() {
peahb58a1582016-03-15 09:34:24 -07001320 public_submodules_->echo_cancellation->Initialize(
1321 proc_sample_rate_hz(), num_reverse_channels(), num_output_channels(),
1322 num_proc_channels());
peahb624d8c2016-03-05 03:01:14 -08001323}
1324
peahbfa97112016-03-10 21:09:04 -08001325void AudioProcessingImpl::InitializeGainController() {
peahb8fbb542016-03-15 02:28:08 -07001326 public_submodules_->gain_control->Initialize(num_proc_channels(),
1327 proc_sample_rate_hz());
peahbfa97112016-03-10 21:09:04 -08001328}
1329
peahbb9edbd2016-03-10 12:54:25 -08001330void AudioProcessingImpl::InitializeEchoControlMobile() {
peah253534d2016-03-15 04:32:28 -07001331 public_submodules_->echo_control_mobile->Initialize(
aluebs776593b2016-03-15 14:04:58 -07001332 proc_split_sample_rate_hz(),
1333 num_reverse_channels(),
1334 num_output_channels());
peahbb9edbd2016-03-10 12:54:25 -08001335}
1336
solenberg949028f2015-12-15 11:39:38 -08001337void AudioProcessingImpl::InitializeLevelEstimator() {
1338 public_submodules_->level_estimator->Initialize();
1339}
1340
peahca4cac72016-06-29 15:26:12 -07001341void AudioProcessingImpl::InitializeLevelController() {
1342 private_submodules_->level_controller->Initialize(proc_sample_rate_hz());
1343}
1344
solenberga29386c2015-12-16 03:31:12 -08001345void AudioProcessingImpl::InitializeVoiceDetection() {
1346 public_submodules_->voice_detection->Initialize(proc_split_sample_rate_hz());
1347}
1348
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001349void AudioProcessingImpl::MaybeUpdateHistograms() {
Bjorn Volckerd92f2672015-07-05 10:46:01 +02001350 static const int kMinDiffDelayMs = 60;
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001351
1352 if (echo_cancellation()->is_enabled()) {
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001353 // Activate delay_jumps_ counters if we know echo_cancellation is runnning.
1354 // If a stream has echo we know that the echo_cancellation is in process.
peahdf3efa82015-11-28 12:35:15 -08001355 if (capture_.stream_delay_jumps == -1 &&
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001356 echo_cancellation()->stream_has_echo()) {
peahdf3efa82015-11-28 12:35:15 -08001357 capture_.stream_delay_jumps = 0;
1358 }
1359 if (capture_.aec_system_delay_jumps == -1 &&
1360 echo_cancellation()->stream_has_echo()) {
1361 capture_.aec_system_delay_jumps = 0;
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001362 }
1363
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001364 // Detect a jump in platform reported system delay and log the difference.
peahdf3efa82015-11-28 12:35:15 -08001365 const int diff_stream_delay_ms =
1366 capture_nonlocked_.stream_delay_ms - capture_.last_stream_delay_ms;
1367 if (diff_stream_delay_ms > kMinDiffDelayMs &&
1368 capture_.last_stream_delay_ms != 0) {
asaperssona2c58e22016-03-07 01:52:59 -08001369 RTC_HISTOGRAM_COUNTS("WebRTC.Audio.PlatformReportedStreamDelayJump",
1370 diff_stream_delay_ms, kMinDiffDelayMs, 1000, 100);
peahdf3efa82015-11-28 12:35:15 -08001371 if (capture_.stream_delay_jumps == -1) {
1372 capture_.stream_delay_jumps = 0; // Activate counter if needed.
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001373 }
peahdf3efa82015-11-28 12:35:15 -08001374 capture_.stream_delay_jumps++;
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001375 }
peahdf3efa82015-11-28 12:35:15 -08001376 capture_.last_stream_delay_ms = capture_nonlocked_.stream_delay_ms;
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001377
1378 // Detect a jump in AEC system delay and log the difference.
peah20028c42016-03-04 11:50:54 -08001379 const int samples_per_ms =
peahdf3efa82015-11-28 12:35:15 -08001380 rtc::CheckedDivExact(capture_nonlocked_.split_rate, 1000);
peah20028c42016-03-04 11:50:54 -08001381 RTC_DCHECK_LT(0, samples_per_ms);
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001382 const int aec_system_delay_ms =
peah20028c42016-03-04 11:50:54 -08001383 public_submodules_->echo_cancellation->GetSystemDelayInSamples() /
1384 samples_per_ms;
Michael Graczyk86c6d332015-07-23 11:41:39 -07001385 const int diff_aec_system_delay_ms =
peahdf3efa82015-11-28 12:35:15 -08001386 aec_system_delay_ms - capture_.last_aec_system_delay_ms;
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001387 if (diff_aec_system_delay_ms > kMinDiffDelayMs &&
peahdf3efa82015-11-28 12:35:15 -08001388 capture_.last_aec_system_delay_ms != 0) {
asaperssona2c58e22016-03-07 01:52:59 -08001389 RTC_HISTOGRAM_COUNTS("WebRTC.Audio.AecSystemDelayJump",
1390 diff_aec_system_delay_ms, kMinDiffDelayMs, 1000,
1391 100);
peahdf3efa82015-11-28 12:35:15 -08001392 if (capture_.aec_system_delay_jumps == -1) {
1393 capture_.aec_system_delay_jumps = 0; // Activate counter if needed.
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001394 }
peahdf3efa82015-11-28 12:35:15 -08001395 capture_.aec_system_delay_jumps++;
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001396 }
peahdf3efa82015-11-28 12:35:15 -08001397 capture_.last_aec_system_delay_ms = aec_system_delay_ms;
Bjorn Volcker1ca324f2015-06-29 14:57:29 +02001398 }
1399}
1400
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001401void AudioProcessingImpl::UpdateHistogramsOnCallEnd() {
peahdf3efa82015-11-28 12:35:15 -08001402 // Run in a single-threaded manner.
1403 rtc::CritScope cs_render(&crit_render_);
1404 rtc::CritScope cs_capture(&crit_capture_);
1405
1406 if (capture_.stream_delay_jumps > -1) {
asaperssona2c58e22016-03-07 01:52:59 -08001407 RTC_HISTOGRAM_ENUMERATION(
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001408 "WebRTC.Audio.NumOfPlatformReportedStreamDelayJumps",
peahdf3efa82015-11-28 12:35:15 -08001409 capture_.stream_delay_jumps, 51);
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001410 }
peahdf3efa82015-11-28 12:35:15 -08001411 capture_.stream_delay_jumps = -1;
1412 capture_.last_stream_delay_ms = 0;
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001413
peahdf3efa82015-11-28 12:35:15 -08001414 if (capture_.aec_system_delay_jumps > -1) {
asaperssona2c58e22016-03-07 01:52:59 -08001415 RTC_HISTOGRAM_ENUMERATION("WebRTC.Audio.NumOfAecSystemDelayJumps",
1416 capture_.aec_system_delay_jumps, 51);
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001417 }
peahdf3efa82015-11-28 12:35:15 -08001418 capture_.aec_system_delay_jumps = -1;
1419 capture_.last_aec_system_delay_ms = 0;
Bjorn Volcker4e7aa432015-07-07 11:50:05 +02001420}
1421
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001422#ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP
peahdf3efa82015-11-28 12:35:15 -08001423int AudioProcessingImpl::WriteMessageToDebugFile(
1424 FileWrapper* debug_file,
ivocd66b44d2016-01-15 03:06:36 -08001425 int64_t* filesize_limit_bytes,
peahdf3efa82015-11-28 12:35:15 -08001426 rtc::CriticalSection* crit_debug,
1427 ApmDebugDumpThreadState* debug_state) {
1428 int32_t size = debug_state->event_msg->ByteSize();
ajm@google.com808e0e02011-08-03 21:08:51 +00001429 if (size <= 0) {
1430 return kUnspecifiedError;
1431 }
andrew@webrtc.org621df672013-10-22 10:27:23 +00001432#if defined(WEBRTC_ARCH_BIG_ENDIAN)
Michael Graczyk86c6d332015-07-23 11:41:39 -07001433// TODO(ajm): Use little-endian "on the wire". For the moment, we can be
1434// pretty safe in assuming little-endian.
ajm@google.com808e0e02011-08-03 21:08:51 +00001435#endif
1436
peahdf3efa82015-11-28 12:35:15 -08001437 if (!debug_state->event_msg->SerializeToString(&debug_state->event_str)) {
ajm@google.com808e0e02011-08-03 21:08:51 +00001438 return kUnspecifiedError;
1439 }
1440
peahdf3efa82015-11-28 12:35:15 -08001441 {
1442 // Ensure atomic writes of the message.
ivocd66b44d2016-01-15 03:06:36 -08001443 rtc::CritScope cs_debug(crit_debug);
1444
tommia6219cc2016-06-15 10:30:14 -07001445 RTC_DCHECK(debug_file->is_open());
ivocd66b44d2016-01-15 03:06:36 -08001446 // Update the byte counter.
1447 if (*filesize_limit_bytes >= 0) {
1448 *filesize_limit_bytes -=
1449 (sizeof(int32_t) + debug_state->event_str.length());
1450 if (*filesize_limit_bytes < 0) {
1451 // Not enough bytes are left to write this message, so stop logging.
1452 debug_file->CloseFile();
1453 return kNoError;
1454 }
1455 }
peahdf3efa82015-11-28 12:35:15 -08001456 // Write message preceded by its size.
1457 if (!debug_file->Write(&size, sizeof(int32_t))) {
1458 return kFileError;
1459 }
1460 if (!debug_file->Write(debug_state->event_str.data(),
1461 debug_state->event_str.length())) {
1462 return kFileError;
1463 }
ajm@google.com808e0e02011-08-03 21:08:51 +00001464 }
1465
peahdf3efa82015-11-28 12:35:15 -08001466 debug_state->event_msg->Clear();
ajm@google.com808e0e02011-08-03 21:08:51 +00001467
andrew@webrtc.org17e40642014-03-04 20:58:13 +00001468 return kNoError;
ajm@google.com808e0e02011-08-03 21:08:51 +00001469}
1470
1471int AudioProcessingImpl::WriteInitMessage() {
peahdf3efa82015-11-28 12:35:15 -08001472 debug_dump_.capture.event_msg->set_type(audioproc::Event::INIT);
1473 audioproc::Init* msg = debug_dump_.capture.event_msg->mutable_init();
1474 msg->set_sample_rate(formats_.api_format.input_stream().sample_rate_hz());
ajm@google.com808e0e02011-08-03 21:08:51 +00001475
Peter Kasting69558702016-01-12 16:26:35 -08001476 msg->set_num_input_channels(static_cast<google::protobuf::int32>(
1477 formats_.api_format.input_stream().num_channels()));
1478 msg->set_num_output_channels(static_cast<google::protobuf::int32>(
1479 formats_.api_format.output_stream().num_channels()));
1480 msg->set_num_reverse_channels(static_cast<google::protobuf::int32>(
1481 formats_.api_format.reverse_input_stream().num_channels()));
peahdf3efa82015-11-28 12:35:15 -08001482 msg->set_reverse_sample_rate(
1483 formats_.api_format.reverse_input_stream().sample_rate_hz());
1484 msg->set_output_sample_rate(
1485 formats_.api_format.output_stream().sample_rate_hz());
peahc7bdf8a2016-04-11 07:05:53 -07001486 msg->set_reverse_output_sample_rate(
1487 formats_.api_format.reverse_output_stream().sample_rate_hz());
1488 msg->set_num_reverse_output_channels(
1489 formats_.api_format.reverse_output_stream().num_channels());
peahdf3efa82015-11-28 12:35:15 -08001490
1491 RETURN_ON_ERR(WriteMessageToDebugFile(debug_dump_.debug_file.get(),
ivocd66b44d2016-01-15 03:06:36 -08001492 &debug_dump_.num_bytes_left_for_log_,
peahdf3efa82015-11-28 12:35:15 -08001493 &crit_debug_, &debug_dump_.capture));
Minyue13b96ba2015-10-03 00:39:14 +02001494 return kNoError;
1495}
1496
1497int AudioProcessingImpl::WriteConfigMessage(bool forced) {
1498 audioproc::Config config;
1499
peahdf3efa82015-11-28 12:35:15 -08001500 config.set_aec_enabled(public_submodules_->echo_cancellation->is_enabled());
Minyue13b96ba2015-10-03 00:39:14 +02001501 config.set_aec_delay_agnostic_enabled(
peahdf3efa82015-11-28 12:35:15 -08001502 public_submodules_->echo_cancellation->is_delay_agnostic_enabled());
Minyue13b96ba2015-10-03 00:39:14 +02001503 config.set_aec_drift_compensation_enabled(
peahdf3efa82015-11-28 12:35:15 -08001504 public_submodules_->echo_cancellation->is_drift_compensation_enabled());
Minyue13b96ba2015-10-03 00:39:14 +02001505 config.set_aec_extended_filter_enabled(
peahdf3efa82015-11-28 12:35:15 -08001506 public_submodules_->echo_cancellation->is_extended_filter_enabled());
1507 config.set_aec_suppression_level(static_cast<int>(
1508 public_submodules_->echo_cancellation->suppression_level()));
Minyue13b96ba2015-10-03 00:39:14 +02001509
peahdf3efa82015-11-28 12:35:15 -08001510 config.set_aecm_enabled(
1511 public_submodules_->echo_control_mobile->is_enabled());
Minyue13b96ba2015-10-03 00:39:14 +02001512 config.set_aecm_comfort_noise_enabled(
peahdf3efa82015-11-28 12:35:15 -08001513 public_submodules_->echo_control_mobile->is_comfort_noise_enabled());
1514 config.set_aecm_routing_mode(static_cast<int>(
1515 public_submodules_->echo_control_mobile->routing_mode()));
Minyue13b96ba2015-10-03 00:39:14 +02001516
peahdf3efa82015-11-28 12:35:15 -08001517 config.set_agc_enabled(public_submodules_->gain_control->is_enabled());
1518 config.set_agc_mode(
1519 static_cast<int>(public_submodules_->gain_control->mode()));
1520 config.set_agc_limiter_enabled(
1521 public_submodules_->gain_control->is_limiter_enabled());
peahbe615622016-02-13 16:40:47 -08001522 config.set_noise_robust_agc_enabled(constants_.use_experimental_agc);
Minyue13b96ba2015-10-03 00:39:14 +02001523
peahdf3efa82015-11-28 12:35:15 -08001524 config.set_hpf_enabled(public_submodules_->high_pass_filter->is_enabled());
Minyue13b96ba2015-10-03 00:39:14 +02001525
peahdf3efa82015-11-28 12:35:15 -08001526 config.set_ns_enabled(public_submodules_->noise_suppression->is_enabled());
1527 config.set_ns_level(
1528 static_cast<int>(public_submodules_->noise_suppression->level()));
Minyue13b96ba2015-10-03 00:39:14 +02001529
peahdf3efa82015-11-28 12:35:15 -08001530 config.set_transient_suppression_enabled(
1531 capture_.transient_suppressor_enabled);
Alejandro Luebsc9b0c262016-05-16 15:32:38 -07001532 config.set_intelligibility_enhancer_enabled(
1533 capture_nonlocked_.intelligibility_enabled);
Minyue13b96ba2015-10-03 00:39:14 +02001534
peah7789fe72016-04-15 01:19:44 -07001535 std::string experiments_description =
1536 public_submodules_->echo_cancellation->GetExperimentsDescription();
1537 // TODO(peah): Add semicolon-separated concatenations of experiment
1538 // descriptions for other submodules.
peahca4cac72016-06-29 15:26:12 -07001539 if (capture_nonlocked_.level_controller_enabled) {
1540 experiments_description += "LevelController;";
1541 }
peah7789fe72016-04-15 01:19:44 -07001542 config.set_experiments_description(experiments_description);
1543
Minyue13b96ba2015-10-03 00:39:14 +02001544 std::string serialized_config = config.SerializeAsString();
peahdf3efa82015-11-28 12:35:15 -08001545 if (!forced &&
1546 debug_dump_.capture.last_serialized_config == serialized_config) {
Minyue13b96ba2015-10-03 00:39:14 +02001547 return kNoError;
ajm@google.com808e0e02011-08-03 21:08:51 +00001548 }
1549
peahdf3efa82015-11-28 12:35:15 -08001550 debug_dump_.capture.last_serialized_config = serialized_config;
Minyue13b96ba2015-10-03 00:39:14 +02001551
peahdf3efa82015-11-28 12:35:15 -08001552 debug_dump_.capture.event_msg->set_type(audioproc::Event::CONFIG);
1553 debug_dump_.capture.event_msg->mutable_config()->CopyFrom(config);
Minyue13b96ba2015-10-03 00:39:14 +02001554
peahdf3efa82015-11-28 12:35:15 -08001555 RETURN_ON_ERR(WriteMessageToDebugFile(debug_dump_.debug_file.get(),
ivocd66b44d2016-01-15 03:06:36 -08001556 &debug_dump_.num_bytes_left_for_log_,
peahdf3efa82015-11-28 12:35:15 -08001557 &crit_debug_, &debug_dump_.capture));
ajm@google.com808e0e02011-08-03 21:08:51 +00001558 return kNoError;
1559}
andrew@webrtc.org7bf26462011-12-03 00:03:31 +00001560#endif // WEBRTC_AUDIOPROC_DEBUG_DUMP
andrew@webrtc.orgddbb8a22014-04-22 21:00:04 +00001561
kwiberg83ffe452016-08-29 14:46:07 -07001562AudioProcessingImpl::ApmCaptureState::ApmCaptureState(
1563 bool transient_suppressor_enabled,
1564 const std::vector<Point>& array_geometry,
1565 SphericalPointf target_direction)
1566 : aec_system_delay_jumps(-1),
1567 delay_offset_ms(0),
1568 was_stream_delay_set(false),
1569 last_stream_delay_ms(0),
1570 last_aec_system_delay_ms(0),
1571 stream_delay_jumps(-1),
1572 output_will_be_muted(false),
1573 key_pressed(false),
1574 transient_suppressor_enabled(transient_suppressor_enabled),
1575 array_geometry(array_geometry),
1576 target_direction(target_direction),
1577 fwd_proc_format(kSampleRate16kHz),
1578 split_rate(kSampleRate16kHz) {}
1579
1580AudioProcessingImpl::ApmCaptureState::~ApmCaptureState() = default;
1581
1582AudioProcessingImpl::ApmRenderState::ApmRenderState() = default;
1583
1584AudioProcessingImpl::ApmRenderState::~ApmRenderState() = default;
1585
niklase@google.com470e71d2011-07-07 08:21:25 +00001586} // namespace webrtc