/*
 * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
 *
 * Use of this source code is governed by a BSD-style license
 * that can be found in the LICENSE file in the root of the source
 * tree. An additional intellectual property rights grant can be found
 * in the file PATENTS. All contributing project authors may
 * be found in the AUTHORS file in the root of the source tree.
 */

Alex Loikoe36e8bb2018-02-16 11:54:07 +010011#include "modules/audio_processing/gain_controller2.h"
alessiob3ec96df2017-05-22 06:57:06 -070012
Alessio Bazzica38901042021-10-14 12:14:21 +020013#include <memory>
14#include <utility>
15
Alessio Bazzica3e4c77f2018-11-01 21:31:38 +010016#include "common_audio/include/audio_util.h"
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020017#include "modules/audio_processing/agc2/cpu_features.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020018#include "modules/audio_processing/audio_buffer.h"
Alex Loikoe36e8bb2018-02-16 11:54:07 +010019#include "modules/audio_processing/include/audio_frame_view.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020020#include "modules/audio_processing/logging/apm_data_dumper.h"
Steve Anton10542f22019-01-11 09:11:00 -080021#include "rtc_base/atomic_ops.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020022#include "rtc_base/checks.h"
Alessio Bazzica08d2a702020-11-20 16:26:24 +010023#include "rtc_base/logging.h"
Jonas Olsson366a50c2018-09-06 13:41:30 +020024#include "rtc_base/strings/string_builder.h"
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020025#include "system_wrappers/include/field_trial.h"
alessiob3ec96df2017-05-22 06:57:06 -070026
27namespace webrtc {
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +020028namespace {
Alessio Bazzica38901042021-10-14 12:14:21 +020029
30using Agc2Config = AudioProcessing::Config::GainController2;
31
// Value held by `analog_level_` after construction and after `Initialize()`,
// i.e., until `NotifyAnalogLevel()` stores a level.
constexpr int kUnspecifiedAnalogLevel = -1;
// The limiter stats are logged once every `kLogLimiterStatsPeriodNumFrames`
// calls to `Process()`; the count is derived from the period and the frame
// length below.
constexpr int kLogLimiterStatsPeriodMs = 30'000;
constexpr int kFrameLengthMs = 10;
constexpr int kLogLimiterStatsPeriodNumFrames =
    kLogLimiterStatsPeriodMs / kFrameLengthMs;
Alessio Bazzica38901042021-10-14 12:14:21 +020037
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020038// Detects the available CPU features and applies any kill-switches.
39AvailableCpuFeatures GetAllowedCpuFeatures() {
40 AvailableCpuFeatures features = GetAvailableCpuFeatures();
41 if (field_trial::IsEnabled("WebRTC-Agc2SimdSse2KillSwitch")) {
42 features.sse2 = false;
43 }
44 if (field_trial::IsEnabled("WebRTC-Agc2SimdAvx2KillSwitch")) {
45 features.avx2 = false;
46 }
47 if (field_trial::IsEnabled("WebRTC-Agc2SimdNeonKillSwitch")) {
48 features.neon = false;
49 }
50 return features;
51}
52
Alessio Bazzica38901042021-10-14 12:14:21 +020053// Creates an adaptive digital gain controller if enabled.
Alessio Bazzica2fa46182021-10-26 14:08:23 +020054std::unique_ptr<AdaptiveDigitalGainController> CreateAdaptiveDigitalController(
Alessio Bazzica38901042021-10-14 12:14:21 +020055 const Agc2Config::AdaptiveDigital& config,
56 int sample_rate_hz,
57 int num_channels,
58 ApmDataDumper* data_dumper) {
59 if (config.enabled) {
Alessio Bazzica2fa46182021-10-26 14:08:23 +020060 return std::make_unique<AdaptiveDigitalGainController>(
61 data_dumper, config, sample_rate_hz, num_channels);
Alessio Bazzica38901042021-10-14 12:14:21 +020062 }
63 return nullptr;
64}
65
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +020066} // namespace
alessiob3ec96df2017-05-22 06:57:06 -070067
alessiob3ec96df2017-05-22 06:57:06 -070068int GainController2::instance_count_ = 0;
69
Alessio Bazzica38901042021-10-14 12:14:21 +020070GainController2::GainController2(const Agc2Config& config,
71 int sample_rate_hz,
Hanna Silen0c1ad292022-06-16 16:35:45 +020072 int num_channels,
73 bool use_internal_vad)
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020074 : cpu_features_(GetAllowedCpuFeatures()),
75 data_dumper_(rtc::AtomicOps::Increment(&instance_count_)),
Alessio Bazzica60f675f2021-10-15 15:36:11 +020076 fixed_gain_applier_(
77 /*hard_clip_samples=*/false,
78 /*initial_gain_factor=*/DbToRatio(config.fixed_digital.gain_db)),
Alessio Bazzica38901042021-10-14 12:14:21 +020079 adaptive_digital_controller_(
80 CreateAdaptiveDigitalController(config.adaptive_digital,
81 sample_rate_hz,
82 num_channels,
83 &data_dumper_)),
84 limiter_(sample_rate_hz, &data_dumper_, /*histogram_name_prefix=*/"Agc2"),
85 calls_since_last_limiter_log_(0),
86 analog_level_(kUnspecifiedAnalogLevel) {
87 RTC_DCHECK(Validate(config));
88 data_dumper_.InitiateNewSetOfRecordings();
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020089 const bool use_vad = config.adaptive_digital.enabled;
Hanna Silen0c1ad292022-06-16 16:35:45 +020090 if (use_vad && use_internal_vad) {
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +020091 // TODO(bugs.webrtc.org/7494): Move `vad_reset_period_ms` from adaptive
92 // digital to gain controller 2 config.
93 vad_ = std::make_unique<VoiceActivityDetectorWrapper>(
94 config.adaptive_digital.vad_reset_period_ms, cpu_features_,
95 sample_rate_hz);
96 }
Per Åhgren2bd85ab2020-01-03 10:36:34 +010097}
alessiob3ec96df2017-05-22 06:57:06 -070098
99GainController2::~GainController2() = default;
100
Alessio Bazzicad66a6052021-04-29 16:13:25 +0200101void GainController2::Initialize(int sample_rate_hz, int num_channels) {
Alessio Bazzica270f7b52017-10-13 11:05:17 +0200102 RTC_DCHECK(sample_rate_hz == AudioProcessing::kSampleRate8kHz ||
103 sample_rate_hz == AudioProcessing::kSampleRate16kHz ||
104 sample_rate_hz == AudioProcessing::kSampleRate32kHz ||
105 sample_rate_hz == AudioProcessing::kSampleRate48kHz);
Alessio Bazzica38901042021-10-14 12:14:21 +0200106 // TODO(bugs.webrtc.org/7494): Initialize `fixed_gain_applier_`.
Alessio Bazzica3e4c77f2018-11-01 21:31:38 +0100107 limiter_.SetSampleRate(sample_rate_hz);
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200108 if (vad_) {
109 vad_->Initialize(sample_rate_hz);
110 }
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +0200111 if (adaptive_digital_controller_) {
112 adaptive_digital_controller_->Initialize(sample_rate_hz, num_channels);
Alessio Bazzicad66a6052021-04-29 16:13:25 +0200113 }
Alessio Bazzica8aaa6042021-03-31 15:16:05 +0200114 data_dumper_.InitiateNewSetOfRecordings();
Alessio Bazzica08d2a702020-11-20 16:26:24 +0100115 calls_since_last_limiter_log_ = 0;
Alessio Bazzica38901042021-10-14 12:14:21 +0200116 analog_level_ = kUnspecifiedAnalogLevel;
117}
118
119void GainController2::SetFixedGainDb(float gain_db) {
120 const float gain_factor = DbToRatio(gain_db);
121 if (fixed_gain_applier_.GetGainFactor() != gain_factor) {
122 // Reset the limiter to quickly react on abrupt level changes caused by
123 // large changes of the fixed gain.
124 limiter_.Reset();
125 }
126 fixed_gain_applier_.SetGainFactor(gain_factor);
Alessio Bazzica270f7b52017-10-13 11:05:17 +0200127}
128
Hanna Silen0c1ad292022-06-16 16:35:45 +0200129void GainController2::Process(absl::optional<float> speech_probability,
130 AudioBuffer* audio) {
Alessio Bazzica8aaa6042021-03-31 15:16:05 +0200131 data_dumper_.DumpRaw("agc2_notified_analog_level", analog_level_);
Per Åhgrend47941e2019-08-22 11:51:13 +0200132 AudioFrameView<float> float_frame(audio->channels(), audio->num_channels(),
Alex Loikoe36e8bb2018-02-16 11:54:07 +0100133 audio->num_frames());
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200134 if (vad_) {
135 speech_probability = vad_->Analyze(float_frame);
Hanna Silen0c1ad292022-06-16 16:35:45 +0200136 } else if (speech_probability.has_value()) {
137 RTC_DCHECK_GE(speech_probability.value(), 0.0f);
138 RTC_DCHECK_LE(speech_probability.value(), 1.0f);
139 }
140 if (speech_probability.has_value()) {
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200141 data_dumper_.DumpRaw("agc2_speech_probability", speech_probability.value());
142 }
Alessio Bazzica60f675f2021-10-15 15:36:11 +0200143 fixed_gain_applier_.ApplyGain(float_frame);
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +0200144 if (adaptive_digital_controller_) {
Alessio Bazzicab4d4ae22021-10-15 13:57:56 +0200145 RTC_DCHECK(speech_probability.has_value());
146 adaptive_digital_controller_->Process(
147 float_frame, speech_probability.value(), limiter_.LastAudioLevel());
Alex Loikoe5831742018-08-24 11:28:36 +0200148 }
Alessio Bazzica3e4c77f2018-11-01 21:31:38 +0100149 limiter_.Process(float_frame);
Alessio Bazzica08d2a702020-11-20 16:26:24 +0100150
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +0200151 // Periodically log limiter stats.
152 if (++calls_since_last_limiter_log_ == kLogLimiterStatsPeriodNumFrames) {
Alessio Bazzica08d2a702020-11-20 16:26:24 +0100153 calls_since_last_limiter_log_ = 0;
154 InterpolatedGainCurve::Stats stats = limiter_.GetGainCurveStats();
155 RTC_LOG(LS_INFO) << "AGC2 limiter stats"
156 << " | identity: " << stats.look_ups_identity_region
157 << " | knee: " << stats.look_ups_knee_region
158 << " | limiter: " << stats.look_ups_limiter_region
159 << " | saturation: " << stats.look_ups_saturation_region;
160 }
alessiob3ec96df2017-05-22 06:57:06 -0700161}
162
Alex Loikoa837dd72018-08-06 16:32:12 +0200163void GainController2::NotifyAnalogLevel(int level) {
Alessio Bazzica82ea4ee2021-10-07 09:21:02 +0200164 if (analog_level_ != level && adaptive_digital_controller_) {
165 adaptive_digital_controller_->HandleInputGainChange();
Alex Loikoa837dd72018-08-06 16:32:12 +0200166 }
167 analog_level_ = level;
168}
169
alessiob3ec96df2017-05-22 06:57:06 -0700170bool GainController2::Validate(
171 const AudioProcessing::Config::GainController2& config) {
Alessio Bazzica0c83e152020-10-14 12:49:54 +0200172 const auto& fixed = config.fixed_digital;
173 const auto& adaptive = config.adaptive_digital;
Alessio Bazzicaa850e6c2021-10-04 13:35:55 +0200174 return fixed.gain_db >= 0.0f && fixed.gain_db < 50.f &&
175 adaptive.headroom_db >= 0.0f && adaptive.max_gain_db > 0.0f &&
176 adaptive.initial_gain_db >= 0.0f &&
Alessio Bazzica1ac4f2a2021-09-24 14:59:30 +0200177 adaptive.max_gain_change_db_per_second > 0.0f &&
178 adaptive.max_output_noise_level_dbfs <= 0.0f;
alessiob3ec96df2017-05-22 06:57:06 -0700179}
180
181} // namespace webrtc