/*
 *  Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

#ifndef MODULES_AUDIO_PROCESSING_AEC3_AEC_STATE_H_
#define MODULES_AUDIO_PROCESSING_AEC3_AEC_STATE_H_

#include <algorithm>
#include <array>
#include <cstddef>
#include <memory>
#include <vector>

#include "api/array_view.h"
#include "api/audio/echo_canceller3_config.h"
#include "api/optional.h"
#include "modules/audio_processing/aec3/aec3_common.h"
#include "modules/audio_processing/aec3/delay_estimate.h"
#include "modules/audio_processing/aec3/echo_path_variability.h"
#include "modules/audio_processing/aec3/erl_estimator.h"
#include "modules/audio_processing/aec3/erle_estimator.h"
#include "modules/audio_processing/aec3/render_buffer.h"
#include "rtc_base/constructormagic.h"

29namespace webrtc {
30
31class ApmDataDumper;
32
33// Handles the state and the conditions for the echo removal functionality.
34class AecState {
35 public:
Gustaf Ullbergbd83b912017-10-18 12:32:42 +020036 explicit AecState(const EchoCanceller3Config& config);
peah522d71b2017-02-23 05:16:26 -080037 ~AecState();
38
Per Åhgren4b3bc0f2017-12-20 15:26:13 +010039 // Returns whether the echo subtractor can be used to determine the residual
40 // echo.
peah522d71b2017-02-23 05:16:26 -080041 bool UsableLinearEstimate() const { return usable_linear_estimate_; }
42
43 // Returns whether there has been echo leakage detected.
44 bool EchoLeakageDetected() const { return echo_leakage_detected_; }
45
peah522d71b2017-02-23 05:16:26 -080046 // Returns whether the render signal is currently active.
Per Åhgren4b3bc0f2017-12-20 15:26:13 +010047 bool ActiveRender() const { return blocks_with_active_render_ > 200; }
peahebe77782017-02-27 07:29:21 -080048
peah522d71b2017-02-23 05:16:26 -080049 // Returns the ERLE.
50 const std::array<float, kFftLengthBy2Plus1>& Erle() const {
51 return erle_estimator_.Erle();
52 }
53
Gustaf Ullberg332150d2017-11-22 14:17:39 +010054 // Returns the time-domain ERLE.
55 float ErleTimeDomain() const { return erle_estimator_.ErleTimeDomain(); }
56
peah522d71b2017-02-23 05:16:26 -080057 // Returns the ERL.
58 const std::array<float, kFftLengthBy2Plus1>& Erl() const {
59 return erl_estimator_.Erl();
60 }
61
Gustaf Ullberg332150d2017-11-22 14:17:39 +010062 // Returns the time-domain ERL.
63 float ErlTimeDomain() const { return erl_estimator_.ErlTimeDomain(); }
64
peah522d71b2017-02-23 05:16:26 -080065 // Returns the delay estimate based on the linear filter.
Per Åhgren0e6d2f52017-12-20 22:19:56 +010066 int FilterDelay() const { return filter_delay_; }
peah522d71b2017-02-23 05:16:26 -080067
peah522d71b2017-02-23 05:16:26 -080068 // Returns whether the capture signal is saturated.
69 bool SaturatedCapture() const { return capture_signal_saturation_; }
70
peah86afe9d2017-04-06 15:45:32 -070071 // Returns whether the echo signal is saturated.
72 bool SaturatedEcho() const { return echo_saturation_; }
73
Per Åhgren7ddd4632017-10-25 02:59:45 +020074 // Returns whether the echo path can saturate.
75 bool SaturatingEchoPath() const { return saturating_echo_path_; }
76
peah522d71b2017-02-23 05:16:26 -080077 // Updates the capture signal saturation.
78 void UpdateCaptureSaturation(bool capture_signal_saturation) {
79 capture_signal_saturation_ = capture_signal_saturation;
80 }
81
Per Åhgren1b4059e2017-10-15 20:19:21 +020082 // Returns whether the transparent mode is active
83 bool TransparentMode() const { return transparent_mode_; }
peah522d71b2017-02-23 05:16:26 -080084
peah86afe9d2017-04-06 15:45:32 -070085 // Takes appropriate action at an echo path change.
86 void HandleEchoPathChange(const EchoPathVariability& echo_path_variability);
87
peah89420452017-04-07 06:13:39 -070088 // Returns the decay factor for the echo reverberation.
peah29103572017-07-11 02:54:02 -070089 float ReverbDecay() const { return reverb_decay_; }
peah89420452017-04-07 06:13:39 -070090
Per Åhgrenb6b00dc2018-02-20 22:18:27 +010091 // Returns the upper limit for the echo suppression gain.
92 float SuppressionGainLimit() const { return suppressor_gain_limit_; }
peah6d822ad2017-04-10 13:52:14 -070093
peah29103572017-07-11 02:54:02 -070094 // Returns whether the echo in the capture signal is audible.
95 bool InaudibleEcho() const { return echo_audibility_.InaudibleEcho(); }
96
97 // Updates the aec state with the AEC output signal.
98 void UpdateWithOutput(rtc::ArrayView<const float> e) {
99 echo_audibility_.UpdateWithOutput(e);
100 }
101
Per Åhgren4b3bc0f2017-12-20 15:26:13 +0100102 // Returns whether the linear filter should have been able to properly adapt.
103 bool FilterHasHadTimeToConverge() const {
104 return filter_has_had_time_to_converge_;
105 }
Per Åhgren1b4059e2017-10-15 20:19:21 +0200106
Per Åhgrena98c8072018-01-15 19:17:16 +0100107 // Returns whether the filter adaptation is still in the initial state.
108 bool InitialState() const { return initial_state_; }
109
peah522d71b2017-02-23 05:16:26 -0800110 // Updates the aec state.
Per Åhgren3ab308f2018-02-21 08:46:03 +0100111 void Update(const rtc::Optional<DelayEstimate>& delay_estimate,
112 const std::vector<std::array<float, kFftLengthBy2Plus1>>&
peah86afe9d2017-04-06 15:45:32 -0700113 adaptive_filter_frequency_response,
Per Åhgren09a718a2017-12-11 22:28:45 +0100114 const std::vector<float>& adaptive_filter_impulse_response,
Per Åhgren1b4059e2017-10-15 20:19:21 +0200115 bool converged_filter,
peah86afe9d2017-04-06 15:45:32 -0700116 const RenderBuffer& render_buffer,
peah522d71b2017-02-23 05:16:26 -0800117 const std::array<float, kFftLengthBy2Plus1>& E2_main,
peah522d71b2017-02-23 05:16:26 -0800118 const std::array<float, kFftLengthBy2Plus1>& Y2,
peah29103572017-07-11 02:54:02 -0700119 const std::array<float, kBlockSize>& s_main,
peah522d71b2017-02-23 05:16:26 -0800120 bool echo_leakage_detected);
121
122 private:
peah29103572017-07-11 02:54:02 -0700123 class EchoAudibility {
124 public:
125 void Update(rtc::ArrayView<const float> x,
Per Åhgren1b4059e2017-10-15 20:19:21 +0200126 const std::array<float, kBlockSize>& s,
127 bool converged_filter);
peah29103572017-07-11 02:54:02 -0700128 void UpdateWithOutput(rtc::ArrayView<const float> e);
129 bool InaudibleEcho() const { return inaudible_echo_; }
130
131 private:
132 float max_nearend_ = 0.f;
133 size_t max_nearend_counter_ = 0;
134 size_t low_farend_counter_ = 0;
135 bool inaudible_echo_ = false;
136 };
137
Per Åhgren09a718a2017-12-11 22:28:45 +0100138 void UpdateReverb(const std::vector<float>& impulse_response);
Per Åhgren4b3bc0f2017-12-20 15:26:13 +0100139 bool DetectActiveRender(rtc::ArrayView<const float> x) const;
Per Åhgrenb6b00dc2018-02-20 22:18:27 +0100140 void UpdateSuppressorGainLimit(bool render_activity);
Per Åhgren4b3bc0f2017-12-20 15:26:13 +0100141 bool DetectEchoSaturation(rtc::ArrayView<const float> x);
peah29103572017-07-11 02:54:02 -0700142
peah522d71b2017-02-23 05:16:26 -0800143 static int instance_count_;
144 std::unique_ptr<ApmDataDumper> data_dumper_;
145 ErlEstimator erl_estimator_;
146 ErleEstimator erle_estimator_;
Per Åhgren1b4059e2017-10-15 20:19:21 +0200147 size_t capture_block_counter_ = 0;
Per Åhgren4b3bc0f2017-12-20 15:26:13 +0100148 size_t blocks_with_proper_filter_adaptation_ = 0;
149 size_t blocks_with_active_render_ = 0;
peah522d71b2017-02-23 05:16:26 -0800150 bool usable_linear_estimate_ = false;
151 bool echo_leakage_detected_ = false;
peah522d71b2017-02-23 05:16:26 -0800152 bool capture_signal_saturation_ = false;
peah86afe9d2017-04-06 15:45:32 -0700153 bool echo_saturation_ = false;
Per Åhgren1b4059e2017-10-15 20:19:21 +0200154 bool transparent_mode_ = false;
Per Åhgren63b494d2017-12-06 11:32:38 +0100155 float previous_max_sample_ = 0.f;
peahe52a2032017-04-19 09:03:40 -0700156 bool render_received_ = false;
Per Åhgrenb6b00dc2018-02-20 22:18:27 +0100157 int realignment_counter_ = 0;
158 float suppressor_gain_limit_ = 1.f;
159 bool active_render_seen_ = false;
Per Åhgren0e6d2f52017-12-20 22:19:56 +0100160 int filter_delay_ = 0;
peah86afe9d2017-04-06 15:45:32 -0700161 size_t blocks_since_last_saturation_ = 1000;
peah29103572017-07-11 02:54:02 -0700162 float reverb_decay_to_test_ = 0.9f;
163 float reverb_decay_candidate_ = 0.f;
164 float reverb_decay_candidate_residual_ = -1.f;
165 EchoAudibility echo_audibility_;
Gustaf Ullbergbd83b912017-10-18 12:32:42 +0200166 const EchoCanceller3Config config_;
Per Åhgren09a718a2017-12-11 22:28:45 +0100167 std::vector<float> max_render_;
peah8cee56f2017-08-24 22:36:53 -0700168 float reverb_decay_;
Per Åhgren7ddd4632017-10-25 02:59:45 +0200169 bool saturating_echo_path_ = false;
Per Åhgren4b3bc0f2017-12-20 15:26:13 +0100170 bool filter_has_had_time_to_converge_ = false;
Per Åhgrena98c8072018-01-15 19:17:16 +0100171 bool initial_state_ = true;
Per Åhgrenb6b00dc2018-02-20 22:18:27 +0100172 const float gain_rampup_increase_;
peah29103572017-07-11 02:54:02 -0700173
peah8cee56f2017-08-24 22:36:53 -0700174 RTC_DISALLOW_COPY_AND_ASSIGN(AecState);
peah522d71b2017-02-23 05:16:26 -0800175};
176
177} // namespace webrtc

#endif  // MODULES_AUDIO_PROCESSING_AEC3_AEC_STATE_H_