blob: 174647c956601314f09e6852fb40c127a83c6aff [file] [log] [blame]
/*
 * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
 *
 * Use of this source code is governed by a BSD-style license
 * that can be found in the LICENSE file in the root of the source
 * tree. An additional intellectual property rights grant can be found
 * in the file PATENTS. All contributing project authors may
 * be found in the AUTHORS file in the root of the source tree.
 */
10
Alex Loikoe36e8bb2018-02-16 11:54:07 +010011#include "modules/audio_processing/gain_controller2.h"
alessiob3ec96df2017-05-22 06:57:06 -070012
Alessio Bazzica38901042021-10-14 12:14:21 +020013#include <memory>
14#include <utility>
15
Alessio Bazzica3e4c77f2018-11-01 21:31:38 +010016#include "common_audio/include/audio_util.h"
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020017#include "modules/audio_processing/agc2/cpu_features.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020018#include "modules/audio_processing/audio_buffer.h"
Alex Loikoe36e8bb2018-02-16 11:54:07 +010019#include "modules/audio_processing/include/audio_frame_view.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020020#include "modules/audio_processing/logging/apm_data_dumper.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020021#include "rtc_base/checks.h"
Alessio Bazzica08d2a702020-11-20 16:26:24 +010022#include "rtc_base/logging.h"
Jonas Olsson366a50c2018-09-06 13:41:30 +020023#include "rtc_base/strings/string_builder.h"
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020024#include "system_wrappers/include/field_trial.h"
alessiob3ec96df2017-05-22 06:57:06 -070025
26namespace webrtc {
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +020027namespace {
Alessio Bazzica38901042021-10-14 12:14:21 +020028
29using Agc2Config = AudioProcessing::Config::GainController2;
Hanna Silena6574902022-11-30 16:59:05 +010030using InputVolumeControllerConfig = InputVolumeController::Config;
Alessio Bazzica38901042021-10-14 12:14:21 +020031
// Assumed duration of one processed frame, in milliseconds.
constexpr int kFrameLengthMs = 10;
// Time between two consecutive limiter stats log lines, in milliseconds.
constexpr int kLogLimiterStatsPeriodMs = 30'000;
// The same logging period expressed as a number of frames.
constexpr int kLogLimiterStatsPeriodNumFrames =
    kLogLimiterStatsPeriodMs / kFrameLengthMs;
Alessio Bazzica38901042021-10-14 12:14:21 +020036
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020037// Detects the available CPU features and applies any kill-switches.
38AvailableCpuFeatures GetAllowedCpuFeatures() {
39 AvailableCpuFeatures features = GetAvailableCpuFeatures();
40 if (field_trial::IsEnabled("WebRTC-Agc2SimdSse2KillSwitch")) {
41 features.sse2 = false;
42 }
43 if (field_trial::IsEnabled("WebRTC-Agc2SimdAvx2KillSwitch")) {
44 features.avx2 = false;
45 }
46 if (field_trial::IsEnabled("WebRTC-Agc2SimdNeonKillSwitch")) {
47 features.neon = false;
48 }
49 return features;
50}
51
Alessio Bazzica38901042021-10-14 12:14:21 +020052// Creates an adaptive digital gain controller if enabled.
Alessio Bazzica2fa46182021-10-26 14:08:23 +020053std::unique_ptr<AdaptiveDigitalGainController> CreateAdaptiveDigitalController(
Alessio Bazzica38901042021-10-14 12:14:21 +020054 const Agc2Config::AdaptiveDigital& config,
55 int sample_rate_hz,
56 int num_channels,
57 ApmDataDumper* data_dumper) {
58 if (config.enabled) {
Alessio Bazzica2fa46182021-10-26 14:08:23 +020059 return std::make_unique<AdaptiveDigitalGainController>(
60 data_dumper, config, sample_rate_hz, num_channels);
Alessio Bazzica38901042021-10-14 12:14:21 +020061 }
62 return nullptr;
63}
64
Hanna Silend7cfbe32022-11-02 19:12:20 +010065// Creates an input volume controller if `enabled` is true.
66std::unique_ptr<InputVolumeController> CreateInputVolumeController(
67 bool enabled,
Hanna Silena6574902022-11-30 16:59:05 +010068 const InputVolumeControllerConfig& config,
Hanna Silend7cfbe32022-11-02 19:12:20 +010069 int num_channels) {
70 if (enabled) {
Hanna Silena6574902022-11-30 16:59:05 +010071 return std::make_unique<InputVolumeController>(num_channels, config);
Hanna Silend7cfbe32022-11-02 19:12:20 +010072 }
73 return nullptr;
74}
75
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +020076} // namespace
alessiob3ec96df2017-05-22 06:57:06 -070077
Niels Möller7a669002022-06-27 09:47:02 +020078std::atomic<int> GainController2::instance_count_(0);
alessiob3ec96df2017-05-22 06:57:06 -070079
Hanna Silena6574902022-11-30 16:59:05 +010080GainController2::GainController2(
81 const Agc2Config& config,
82 const InputVolumeControllerConfig& input_volume_controller_config,
83 int sample_rate_hz,
84 int num_channels,
85 bool use_internal_vad)
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020086 : cpu_features_(GetAllowedCpuFeatures()),
Niels Möller7a669002022-06-27 09:47:02 +020087 data_dumper_(instance_count_.fetch_add(1) + 1),
Alessio Bazzica60f675f2021-10-15 15:36:11 +020088 fixed_gain_applier_(
89 /*hard_clip_samples=*/false,
90 /*initial_gain_factor=*/DbToRatio(config.fixed_digital.gain_db)),
Alessio Bazzica38901042021-10-14 12:14:21 +020091 adaptive_digital_controller_(
92 CreateAdaptiveDigitalController(config.adaptive_digital,
93 sample_rate_hz,
94 num_channels,
95 &data_dumper_)),
Hanna Silend7cfbe32022-11-02 19:12:20 +010096 input_volume_controller_(
97 CreateInputVolumeController(config.input_volume_controller.enabled,
Hanna Silena6574902022-11-30 16:59:05 +010098 input_volume_controller_config,
Hanna Silend7cfbe32022-11-02 19:12:20 +010099 num_channels)),
Alessio Bazzica38901042021-10-14 12:14:21 +0200100 limiter_(sample_rate_hz, &data_dumper_, /*histogram_name_prefix=*/"Agc2"),
Alessio Bazzicafcf1af32022-09-07 17:14:26 +0200101 calls_since_last_limiter_log_(0) {
Alessio Bazzica38901042021-10-14 12:14:21 +0200102 RTC_DCHECK(Validate(config));
103 data_dumper_.InitiateNewSetOfRecordings();
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200104 const bool use_vad = config.adaptive_digital.enabled;
Hanna Silen0c1ad292022-06-16 16:35:45 +0200105 if (use_vad && use_internal_vad) {
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200106 // TODO(bugs.webrtc.org/7494): Move `vad_reset_period_ms` from adaptive
107 // digital to gain controller 2 config.
108 vad_ = std::make_unique<VoiceActivityDetectorWrapper>(
109 config.adaptive_digital.vad_reset_period_ms, cpu_features_,
110 sample_rate_hz);
111 }
Hanna Silend7cfbe32022-11-02 19:12:20 +0100112 if (input_volume_controller_) {
113 input_volume_controller_->Initialize();
114 }
Per Åhgren2bd85ab2020-01-03 10:36:34 +0100115}
alessiob3ec96df2017-05-22 06:57:06 -0700116
117GainController2::~GainController2() = default;
118
Hanna Silend7cfbe32022-11-02 19:12:20 +0100119// TODO(webrtc:7494): Pass the flag also to the other components.
120void GainController2::SetCaptureOutputUsed(bool capture_output_used) {
121 if (input_volume_controller_) {
122 input_volume_controller_->HandleCaptureOutputUsedChange(
123 capture_output_used);
124 }
125}
126
Alessio Bazzica38901042021-10-14 12:14:21 +0200127void GainController2::SetFixedGainDb(float gain_db) {
128 const float gain_factor = DbToRatio(gain_db);
129 if (fixed_gain_applier_.GetGainFactor() != gain_factor) {
130 // Reset the limiter to quickly react on abrupt level changes caused by
131 // large changes of the fixed gain.
132 limiter_.Reset();
133 }
134 fixed_gain_applier_.SetGainFactor(gain_factor);
Alessio Bazzica270f7b52017-10-13 11:05:17 +0200135}
136
Hanna Silend7cfbe32022-11-02 19:12:20 +0100137void GainController2::Analyze(int applied_input_volume,
138 const AudioBuffer& audio_buffer) {
139 RTC_DCHECK_GE(applied_input_volume, 0);
140 RTC_DCHECK_LE(applied_input_volume, 255);
141
142 if (input_volume_controller_) {
143 input_volume_controller_->set_stream_analog_level(applied_input_volume);
144 input_volume_controller_->AnalyzePreProcess(audio_buffer);
145 }
146}
147
148absl::optional<int> GainController2::GetRecommendedInputVolume() const {
149 return input_volume_controller_
150 ? absl::optional<int>(
151 input_volume_controller_->recommended_analog_level())
152 : absl::nullopt;
153}
154
Hanna Silen0c1ad292022-06-16 16:35:45 +0200155void GainController2::Process(absl::optional<float> speech_probability,
Alessio Bazzicafcf1af32022-09-07 17:14:26 +0200156 bool input_volume_changed,
Hanna Silen0c1ad292022-06-16 16:35:45 +0200157 AudioBuffer* audio) {
Alessio Bazzicafcf1af32022-09-07 17:14:26 +0200158 data_dumper_.DumpRaw("agc2_applied_input_volume_changed",
159 input_volume_changed);
160 if (input_volume_changed && !!adaptive_digital_controller_) {
161 adaptive_digital_controller_->HandleInputGainChange();
162 }
163
Per Åhgrend47941e2019-08-22 11:51:13 +0200164 AudioFrameView<float> float_frame(audio->channels(), audio->num_channels(),
Alex Loikoe36e8bb2018-02-16 11:54:07 +0100165 audio->num_frames());
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200166 if (vad_) {
167 speech_probability = vad_->Analyze(float_frame);
Hanna Silen0c1ad292022-06-16 16:35:45 +0200168 } else if (speech_probability.has_value()) {
169 RTC_DCHECK_GE(speech_probability.value(), 0.0f);
170 RTC_DCHECK_LE(speech_probability.value(), 1.0f);
171 }
172 if (speech_probability.has_value()) {
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200173 data_dumper_.DumpRaw("agc2_speech_probability", speech_probability.value());
174 }
Hanna Silend7cfbe32022-11-02 19:12:20 +0100175
176 if (input_volume_controller_) {
Hanna Silen27fed452022-11-22 15:00:58 +0100177 // TODO(bugs.webrtc.org/7494): A temprorary check, remove once not needed.
178 RTC_DCHECK(adaptive_digital_controller_);
Hanna Silend7cfbe32022-11-02 19:12:20 +0100179 absl::optional<float> speech_level;
180 if (adaptive_digital_controller_) {
181 speech_level =
182 adaptive_digital_controller_->GetSpeechLevelDbfsIfConfident();
183 }
Hanna Silen27fed452022-11-22 15:00:58 +0100184 RTC_DCHECK(speech_probability.has_value());
185 if (speech_probability.has_value()) {
186 input_volume_controller_->Process(*speech_probability, speech_level);
187 }
Hanna Silend7cfbe32022-11-02 19:12:20 +0100188 }
189
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +0200190 if (adaptive_digital_controller_) {
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200191 RTC_DCHECK(speech_probability.has_value());
192 adaptive_digital_controller_->Process(
193 float_frame, speech_probability.value(), limiter_.LastAudioLevel());
Alex Loikoe5831742018-08-24 11:28:36 +0200194 }
Alessio Bazzica4366c542022-12-05 16:31:16 +0100195
196 fixed_gain_applier_.ApplyGain(float_frame);
197
Alessio Bazzica3e4c77f2018-11-01 21:31:38 +0100198 limiter_.Process(float_frame);
Alessio Bazzica08d2a702020-11-20 16:26:24 +0100199
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +0200200 // Periodically log limiter stats.
201 if (++calls_since_last_limiter_log_ == kLogLimiterStatsPeriodNumFrames) {
Alessio Bazzica08d2a702020-11-20 16:26:24 +0100202 calls_since_last_limiter_log_ = 0;
203 InterpolatedGainCurve::Stats stats = limiter_.GetGainCurveStats();
204 RTC_LOG(LS_INFO) << "AGC2 limiter stats"
205 << " | identity: " << stats.look_ups_identity_region
206 << " | knee: " << stats.look_ups_knee_region
207 << " | limiter: " << stats.look_ups_limiter_region
208 << " | saturation: " << stats.look_ups_saturation_region;
209 }
alessiob3ec96df2017-05-22 06:57:06 -0700210}
211
212bool GainController2::Validate(
213 const AudioProcessing::Config::GainController2& config) {
Alessio Bazzica0c83e152020-10-14 12:49:54 +0200214 const auto& fixed = config.fixed_digital;
215 const auto& adaptive = config.adaptive_digital;
Alessio Bazzicaa850e6c2021-10-04 13:35:55 +0200216 return fixed.gain_db >= 0.0f && fixed.gain_db < 50.f &&
217 adaptive.headroom_db >= 0.0f && adaptive.max_gain_db > 0.0f &&
218 adaptive.initial_gain_db >= 0.0f &&
Alessio Bazzica1ac4f2a2021-09-24 14:59:30 +0200219 adaptive.max_gain_change_db_per_second > 0.0f &&
220 adaptive.max_output_noise_level_dbfs <= 0.0f;
alessiob3ec96df2017-05-22 06:57:06 -0700221}
222
223} // namespace webrtc