blob: 1d55647693de9c0fbf1fb2c526fde9944bc338bf [file] [log] [blame]
peah522d71b2017-02-23 05:16:26 -08001/*
2 * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_AUDIO_PROCESSING_AEC3_SUPPRESSION_GAIN_H_
12#define MODULES_AUDIO_PROCESSING_AEC3_SUPPRESSION_GAIN_H_
peah522d71b2017-02-23 05:16:26 -080013
14#include <array>
Yves Gerey988cc082018-10-23 12:03:01 +020015#include <memory>
peah86afe9d2017-04-06 15:45:32 -070016#include <vector>
peah522d71b2017-02-23 05:16:26 -080017
Yves Gerey988cc082018-10-23 12:03:01 +020018#include "absl/types/optional.h"
19#include "api/array_view.h"
Gustaf Ullberg3646f972018-02-14 15:19:04 +010020#include "api/audio/echo_canceller3_config.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020021#include "modules/audio_processing/aec3/aec3_common.h"
Per Åhgren7ddd4632017-10-25 02:59:45 +020022#include "modules/audio_processing/aec3/aec_state.h"
Yves Gerey988cc082018-10-23 12:03:01 +020023#include "modules/audio_processing/aec3/fft_data.h"
Gustaf Ullberg8406c432018-06-19 12:31:33 +020024#include "modules/audio_processing/aec3/moving_average.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020025#include "modules/audio_processing/aec3/render_signal_analyzer.h"
Yves Gerey988cc082018-10-23 12:03:01 +020026#include "modules/audio_processing/logging/apm_data_dumper.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020027#include "rtc_base/constructormagic.h"
peah522d71b2017-02-23 05:16:26 -080028
29namespace webrtc {
peah522d71b2017-02-23 05:16:26 -080030
// Declares the SuppressionGain class. Only declarations are visible in this
// header; the member function definitions live elsewhere.
// NOTE(review): every line of this listing carries blame-view residue (author,
// commit hash, timestamp and original line number) fused in front of the code.
// It is left untouched here and must be stripped before this can compile.
31class SuppressionGain {
32 public:
  // Constructed from an echo canceller configuration, an optimization
  // selector and the sample rate in Hz.
Gustaf Ullbergbd83b912017-10-18 12:32:42 +020033 SuppressionGain(const EchoCanceller3Config& config,
Per Åhgren47d7fbd2018-04-24 12:44:29 +020034 Aec3Optimization optimization,
35 int sample_rate_hz);
36 ~SuppressionGain();
  // Takes five kFftLengthBy2Plus1-sized spectra, two FftData objects, the
  // render signal analyzer, the AEC state and the render signal, all by const
  // reference. |high_bands_gain| and |low_band_gain| are the only non-const
  // arguments, so they are presumably the outputs (a single float and one
  // value per spectrum bin, respectively) - confirm against the definition.
37 void GetGain(
Jesús de Vicente Peña0faf0822018-09-24 12:48:28 +020038 const std::array<float, kFftLengthBy2Plus1>& suppressor_input_spectrum,
Per Åhgren47d7fbd2018-04-24 12:44:29 +020039 const std::array<float, kFftLengthBy2Plus1>& nearend_spectrum,
40 const std::array<float, kFftLengthBy2Plus1>& echo_spectrum,
Per Åhgrenfde4aa92018-08-27 14:19:35 +020041 const std::array<float, kFftLengthBy2Plus1>& residual_echo_spectrum,
Per Åhgren47d7fbd2018-04-24 12:44:29 +020042 const std::array<float, kFftLengthBy2Plus1>& comfort_noise_spectrum,
43 const FftData& linear_aec_fft,
Per Åhgren47d7fbd2018-04-24 12:44:29 +020044 const FftData& capture_fft,
45 const RenderSignalAnalyzer& render_signal_analyzer,
46 const AecState& aec_state,
47 const std::vector<std::vector<float>>& render,
48 float* high_bands_gain,
49 std::array<float, kFftLengthBy2Plus1>* low_band_gain);
peah522d71b2017-02-23 05:16:26 -080050
Per Åhgren5f1a31c2018-03-08 15:54:41 +010051 // Toggles the usage of the initial state.
  // The flag this refers to (|initial_state_|, declared below) defaults to
  // true.
52 void SetInitialState(bool state);
53
peah522d71b2017-02-23 05:16:26 -080054 private:
Per Åhgrenfde4aa92018-08-27 14:19:35 +020055 // Computes the gain to apply for the bands beyond the first band.
  // Const member; returns the gain as a single float. |narrow_peak_band| is
  // optional and may therefore be empty.
56 float UpperBandsGain(
57 const std::array<float, kFftLengthBy2Plus1>& echo_spectrum,
58 const std::array<float, kFftLengthBy2Plus1>& comfort_noise_spectrum,
59 const absl::optional<int>& narrow_peak_band,
60 bool saturated_echo,
61 const std::vector<std::vector<float>>& render,
62 const std::array<float, kFftLengthBy2Plus1>& low_band_gain) const;
63
  // Const helper taking nearend, echo and masker spectra plus per-bin
  // |min_gain| and |max_gain| arrays; |gain| is the only mutable argument.
  // NOTE(review): by its name this limits the gain so that the echo is not
  // audible - confirm against the definition.
Gustaf Ullbergec642172018-07-03 13:48:32 +020064 void GainToNoAudibleEcho(
65 const std::array<float, kFftLengthBy2Plus1>& nearend,
66 const std::array<float, kFftLengthBy2Plus1>& echo,
67 const std::array<float, kFftLengthBy2Plus1>& masker,
68 const std::array<float, kFftLengthBy2Plus1>& min_gain,
69 const std::array<float, kFftLengthBy2Plus1>& max_gain,
70 std::array<float, kFftLengthBy2Plus1>* gain) const;
71
  // Non-const helper whose only mutable argument is |gain|.
  // NOTE(review): presumably the first-band counterpart of UpperBandsGain() -
  // confirm against the definition.
Jesús de Vicente Peña0faf0822018-09-24 12:48:28 +020072 void LowerBandGain(
73 bool stationary_with_low_power,
74 const AecState& aec_state,
75 const std::array<float, kFftLengthBy2Plus1>& suppressor_input,
76 const std::array<float, kFftLengthBy2Plus1>& nearend,
77 const std::array<float, kFftLengthBy2Plus1>& residual_echo,
78 const std::array<float, kFftLengthBy2Plus1>& comfort_noise,
79 std::array<float, kFftLengthBy2Plus1>* gain);
80
  // Const helpers that each receive one mutable view (|min_gain| and
  // |max_gain| respectively); presumably the view is filled in by the call -
  // confirm against the definitions.
81 void GetMinGain(rtc::ArrayView<const float> suppressor_input,
82 rtc::ArrayView<const float> weighted_residual_echo,
83 bool low_noise_render,
84 bool saturated_echo,
85 rtc::ArrayView<float> min_gain) const;
86
87 void GetMaxGain(rtc::ArrayView<float> max_gain) const;
peah1d680892017-05-23 04:07:10 -070088
  // Small stateful helper: Detect() is non-const and the only state is
  // |average_power_|, which starts at 32768 * 32768.
  // NOTE(review): presumably a running average of the render power that
  // Detect() updates - confirm against the definition.
89 class LowNoiseRenderDetector {
90 public:
91 bool Detect(const std::vector<std::vector<float>>& render);
92
93 private:
94 float average_power_ = 32768.f * 32768.f;
95 };
96
Per Åhgren524e8782018-08-24 22:48:49 +020097 // Class for selecting whether the suppressor is in the nearend or echo state.
98 class DominantNearendDetector {
99 public:
  // The detection config struct is taken by value.
100 explicit DominantNearendDetector(
101 const EchoCanceller3Config::Suppressor::DominantNearendDetection
102 config);
103
104 // Returns whether the current state is the nearend state.
105 bool IsNearendState() const { return nearend_state_; }
106
107 // Updates the state selection based on latest spectral estimates.
108 void Update(rtc::ArrayView<const float> nearend_spectrum,
Per Åhgrenfde4aa92018-08-27 14:19:35 +0200109 rtc::ArrayView<const float> residual_echo_spectrum,
Per Åhgren524e8782018-08-24 22:48:49 +0200110 rtc::ArrayView<const float> comfort_noise_spectrum);
111
112 private:
  // Thresholds and durations are const, i.e. fixed at construction.
113 const float enr_threshold_;
Gustaf Ullbergc9f9b872018-10-22 15:15:36 +0200114 const float enr_exit_threshold_;
Per Åhgren524e8782018-08-24 22:48:49 +0200115 const float snr_threshold_;
116 const int hold_duration_;
117 const int trigger_threshold_;
118
  // Mutable state: starts outside the nearend state with both counters at 0.
119 bool nearend_state_ = false;
120 int trigger_counter_ = 0;
121 int hold_counter_ = 0;
122 };
123
  // Parameter set built from a Suppressor::Tuning config: two const scalar
  // factors and three per-bin arrays. Two instances are kept below
  // (|nearend_params_| and |normal_params_|).
124 struct GainParameters {
125 explicit GainParameters(
126 const EchoCanceller3Config::Suppressor::Tuning& tuning);
127 const float max_inc_factor;
128 const float max_dec_factor_lf;
129 std::array<float, kFftLengthBy2Plus1> enr_transparent_;
130 std::array<float, kFftLengthBy2Plus1> enr_suppress_;
131 std::array<float, kFftLengthBy2Plus1> emr_transparent_;
132 };
133
  // Data members. Non-static members are initialized in declaration order, so
  // reordering them changes the construction order.
  // |instance_count_| is static, i.e. shared by all instances.
Gustaf Ullberg216af842018-04-26 12:39:11 +0200134 static int instance_count_;
135 std::unique_ptr<ApmDataDumper> data_dumper_;
peah522d71b2017-02-23 05:16:26 -0800136 const Aec3Optimization optimization_;
Per Åhgren5f1a31c2018-03-08 15:54:41 +0100137 const EchoCanceller3Config config_;
138 const int state_change_duration_blocks_;
139 float one_by_state_change_duration_blocks_;
  // NOTE(review): the three |last_*| arrays have no in-class initializer;
  // presumably they are set by the constructor - confirm.
peah1d680892017-05-23 04:07:10 -0700140 std::array<float, kFftLengthBy2Plus1> last_gain_;
Gustaf Ullberg0e6375e2018-05-04 11:29:02 +0200141 std::array<float, kFftLengthBy2Plus1> last_nearend_;
peah1d680892017-05-23 04:07:10 -0700142 std::array<float, kFftLengthBy2Plus1> last_echo_;
peah1d680892017-05-23 04:07:10 -0700143 LowNoiseRenderDetector low_render_detector_;
Per Åhgren5f1a31c2018-03-08 15:54:41 +0100144 bool initial_state_ = true;
145 int initial_state_change_counter_ = 0;
Gustaf Ullberg8406c432018-06-19 12:31:33 +0200146 aec3::MovingAverage moving_average_;
Per Åhgren524e8782018-08-24 22:48:49 +0200147 const GainParameters nearend_params_;
148 const GainParameters normal_params_;
149 DominantNearendDetector dominant_nearend_detector_;
Per Åhgren47d7fbd2018-04-24 12:44:29 +0200150
  // By its name this macro disables copy construction and assignment for the
  // class; presumably it comes from rtc_base/constructormagic.h - confirm.
peah8cee56f2017-08-24 22:36:53 -0700151 RTC_DISALLOW_COPY_AND_ASSIGN(SuppressionGain);
peah522d71b2017-02-23 05:16:26 -0800152};
153
154} // namespace webrtc
155
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200156#endif // MODULES_AUDIO_PROCESSING_AEC3_SUPPRESSION_GAIN_H_