Blame - modules/audio_processing/agc/legacy/digital_agc.cc - webrtc.googlesource.com/src

blob: e0c076650f7ba4e175179c34fe64fdf09aed8206 [file] [log] [blame]

niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	1	/*
				2	* Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
				3	*
				4	* Use of this source code is governed by a BSD-style license
				5	* that can be found in the LICENSE file in the root of the source
				6	* tree. An additional intellectual property rights grant can be found
				7	* in the file PATENTS. All contributing project authors may
				8	* be found in the AUTHORS file in the root of the source tree.
				9	*/
				10
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	11	#include "modules/audio_processing/agc/legacy/digital_agc.h"
andrew@webrtc.org	3905b0c	2012-01-04 15:47:20 +0000	[diff] [blame]	12
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	13	#include <string.h>
andrew@webrtc.org	3905b0c	2012-01-04 15:47:20 +0000	[diff] [blame]	14
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	15	#include "modules/audio_processing/agc/legacy/gain_control.h"
Per Åhgren	5b139d6	2020-03-20 15:50:14 +0100	[diff] [blame]	16	#include "rtc_base/checks.h"
				17
				18	namespace webrtc {
				19
				20	namespace {
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	21
				22	// To generate the gaintable, copy&paste the following lines to a Matlab window:
				23	// MaxGain = 6; MinGain = 0; CompRatio = 3; Knee = 1;
				24	// zeros = 0:31; lvl = 2.^(1-zeros);
				25	// A = -10*log10(lvl) * (CompRatio - 1) / CompRatio;
				26	// B = MaxGain - MinGain;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	27	// gains = round(2^16*10.^(0.05 * (MinGain + B * (
				28	// log(exp(-Knee*A)+exp(-Knee*B)) - log(1+exp(-Knee*B)) ) /
				29	// log(1/(1+exp(Knee*B))))));
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	30	// fprintf(1, '\t%i, %i, %i, %i,\n', gains);
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	31	// % Matlab code for plotting the gain and input/output level characteristic
				32	// (copy/paste the following 3 lines):
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	33	// in = 10*log10(lvl); out = 20*log10(gains/65536);
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	34	// subplot(121); plot(in, out); axis([-30, 0, -5, 20]); grid on; xlabel('Input
				35	// (dB)'); ylabel('Gain (dB)');
				36	// subplot(122); plot(in, in+out); axis([-30, 0, -30, 5]); grid on;
				37	// xlabel('Input (dB)'); ylabel('Output (dB)');
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	38	// zoom on;
				39
				40	// Generator table for y=log2(1+e^x) in Q8.
andrew@webrtc.org	d77a661	2012-01-04 16:22:24 +0000	[diff] [blame]	41	enum { kGenFuncTableSize = 128 };
pbos@webrtc.org	b7192b8	2013-04-10 07:50:54 +0000	[diff] [blame]	42	static const uint16_t kGenFuncTable[kGenFuncTableSize] = {
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	43	256, 485, 786, 1126, 1484, 1849, 2217, 2586, 2955, 3324, 3693,
				44	4063, 4432, 4801, 5171, 5540, 5909, 6279, 6648, 7017, 7387, 7756,
				45	8125, 8495, 8864, 9233, 9603, 9972, 10341, 10711, 11080, 11449, 11819,
				46	12188, 12557, 12927, 13296, 13665, 14035, 14404, 14773, 15143, 15512, 15881,
				47	16251, 16620, 16989, 17359, 17728, 18097, 18466, 18836, 19205, 19574, 19944,
				48	20313, 20682, 21052, 21421, 21790, 22160, 22529, 22898, 23268, 23637, 24006,
				49	24376, 24745, 25114, 25484, 25853, 26222, 26592, 26961, 27330, 27700, 28069,
				50	28438, 28808, 29177, 29546, 29916, 30285, 30654, 31024, 31393, 31762, 32132,
				51	32501, 32870, 33240, 33609, 33978, 34348, 34717, 35086, 35456, 35825, 36194,
				52	36564, 36933, 37302, 37672, 38041, 38410, 38780, 39149, 39518, 39888, 40257,
				53	40626, 40996, 41365, 41734, 42104, 42473, 42842, 43212, 43581, 43950, 44320,
				54	44689, 45058, 45428, 45797, 46166, 46536, 46905};
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	55
// Ceiling for the VAD update counter, counted in frames; must stay below 3000.
static const int16_t kAvgDecayTime = 250;

// Approximates (A * B) >> 13 without forming the full product: B is split
// into its part above bit 13 and its low 13 bits, and the two partial
// products are summed. (Original note: the 32 most significant bits of
// A(19) * B(26) >> 13.)
#define AGC_MUL32(A, B) \
  ((A) * ((B) >> 13) + (((A) * ((B) & 0x00001FFF)) >> 13))

// Computes C + ((A * B) >> 16), again by splitting B into a high part and its
// low 16 bits so that each partial product stays narrow.
#define AGC_SCALEDIFF32(A, B, C) \
  ((C) + (A) * ((B) >> 16) + (((A) * ((B) & 0x0000FFFF)) >> 16))
				63
				64	} // namespace
				65
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	66	int32_t WebRtcAgc_CalculateGainTable(int32_t* gainTable, // Q16
				67	int16_t digCompGaindB, // Q0
				68	int16_t targetLevelDbfs, // Q0
pbos@webrtc.org	b7192b8	2013-04-10 07:50:54 +0000	[diff] [blame]	69	uint8_t limiterEnable,
Per Åhgren	5b139d6	2020-03-20 15:50:14 +0100	[diff] [blame]	70	int16_t analogTarget) { // Q0
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	71	// This function generates the compressor gain table used in the fixed digital
				72	// part.
				73	uint32_t tmpU32no1, tmpU32no2, absInLevel, logApprox;
				74	int32_t inLevel, limiterLvl;
				75	int32_t tmp32, tmp32no1, tmp32no2, numFIX, den, y32;
				76	const uint16_t kLog10 = 54426; // log2(10) in Q14
				77	const uint16_t kLog10_2 = 49321; // 10*log10(2) in Q14
				78	const uint16_t kLogE_1 = 23637; // log2(e) in Q14
				79	uint16_t constMaxGain;
				80	uint16_t tmpU16, intPart, fracPart;
				81	const int16_t kCompRatio = 3;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	82	int16_t limiterOffset = 0; // Limiter offset
				83	int16_t limiterIdx, limiterLvlX;
Peter Kasting	55ec1a4	2021-07-27 17:14:26 -0700	[diff] [blame^]	84	int16_t constLinApprox, maxGain, diffGain;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	85	int16_t i, tmp16, tmp16no1;
				86	int zeros, zerosScale;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	87
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	88	// Constants
				89	// kLogE_1 = 23637; // log2(e) in Q14
				90	// kLog10 = 54426; // log2(10) in Q14
				91	// kLog10_2 = 49321; // 10*log10(2) in Q14
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	92
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	93	// Calculate maximum digital gain and zero gain level
				94	tmp32no1 = (digCompGaindB - analogTarget) * (kCompRatio - 1);
				95	tmp16no1 = analogTarget - targetLevelDbfs;
				96	tmp16no1 +=
				97	WebRtcSpl_DivW32W16ResW16(tmp32no1 + (kCompRatio >> 1), kCompRatio);
				98	maxGain = WEBRTC_SPL_MAX(tmp16no1, (analogTarget - targetLevelDbfs));
				99	tmp32no1 = maxGain * kCompRatio;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	100	if ((digCompGaindB <= analogTarget) && (limiterEnable)) {
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	101	limiterOffset = 0;
				102	}
				103
Peter Kasting	55ec1a4	2021-07-27 17:14:26 -0700	[diff] [blame^]	104	// Calculate the difference between maximum gain and gain at 0dB0v
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	105	tmp32no1 = digCompGaindB * (kCompRatio - 1);
				106	diffGain =
				107	WebRtcSpl_DivW32W16ResW16(tmp32no1 + (kCompRatio >> 1), kCompRatio);
				108	if (diffGain < 0 \|\| diffGain >= kGenFuncTableSize) {
kwiberg	1e8ed4a	2016-08-26 04:33:34 -0700	[diff] [blame]	109	RTC_DCHECK(0);
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	110	return -1;
				111	}
				112
				113	// Calculate the limiter level and index:
				114	// limiterLvlX = analogTarget - limiterOffset
				115	// limiterLvl = targetLevelDbfs + limiterOffset/compRatio
				116	limiterLvlX = analogTarget - limiterOffset;
				117	limiterIdx = 2 + WebRtcSpl_DivW32W16ResW16((int32_t)limiterLvlX * (1 << 13),
				118	kLog10_2 / 2);
				119	tmp16no1 =
				120	WebRtcSpl_DivW32W16ResW16(limiterOffset + (kCompRatio >> 1), kCompRatio);
				121	limiterLvl = targetLevelDbfs + tmp16no1;
				122
				123	// Calculate (through table lookup):
				124	// constMaxGain = log2(1+2^(log2(e)*diffGain)); (in Q8)
				125	constMaxGain = kGenFuncTable[diffGain]; // in Q8
				126
				127	// Calculate a parameter used to approximate the fractional part of 2^x with a
				128	// piecewise linear function in Q14:
				129	// constLinApprox = round(3/2(4(3-2sqrt(2))/(log(2)^2)-0.5)2^14);
				130	constLinApprox = 22817; // in Q14
				131
				132	// Calculate a denominator used in the exponential part to convert from dB to
				133	// linear scale:
				134	// den = 20*constMaxGain (in Q8)
				135	den = WEBRTC_SPL_MUL_16_U16(20, constMaxGain); // in Q8
				136
				137	for (i = 0; i < 32; i++) {
				138	// Calculate scaled input level (compressor):
				139	// inLevel =
				140	// fix((-constLog10_2(compRatio-1)(1-i)+fix(compRatio/2))/compRatio)
				141	tmp16 = (int16_t)((kCompRatio - 1) * (i - 1)); // Q0
				142	tmp32 = WEBRTC_SPL_MUL_16_U16(tmp16, kLog10_2) + 1; // Q14
				143	inLevel = WebRtcSpl_DivW32W16(tmp32, kCompRatio); // Q14
				144
				145	// Calculate diffGain-inLevel, to map using the genFuncTable
				146	inLevel = (int32_t)diffGain * (1 << 14) - inLevel; // Q14
				147
				148	// Make calculations on abs(inLevel) and compensate for the sign afterwards.
				149	absInLevel = (uint32_t)WEBRTC_SPL_ABS_W32(inLevel); // Q14
				150
				151	// LUT with interpolation
				152	intPart = (uint16_t)(absInLevel >> 14);
				153	fracPart =
				154	(uint16_t)(absInLevel & 0x00003FFF); // extract the fractional part
				155	tmpU16 = kGenFuncTable[intPart + 1] - kGenFuncTable[intPart]; // Q8
				156	tmpU32no1 = tmpU16 * fracPart; // Q22
				157	tmpU32no1 += (uint32_t)kGenFuncTable[intPart] << 14; // Q22
				158	logApprox = tmpU32no1 >> 8; // Q14
				159	// Compensate for negative exponent using the relation:
				160	// log2(1 + 2^-x) = log2(1 + 2^x) - x
				161	if (inLevel < 0) {
				162	zeros = WebRtcSpl_NormU32(absInLevel);
				163	zerosScale = 0;
				164	if (zeros < 15) {
				165	// Not enough space for multiplication
				166	tmpU32no2 = absInLevel >> (15 - zeros); // Q(zeros-1)
				167	tmpU32no2 = WEBRTC_SPL_UMUL_32_16(tmpU32no2, kLogE_1); // Q(zeros+13)
				168	if (zeros < 9) {
				169	zerosScale = 9 - zeros;
				170	tmpU32no1 >>= zerosScale; // Q(zeros+13)
				171	} else {
				172	tmpU32no2 >>= zeros - 9; // Q22
				173	}
				174	} else {
				175	tmpU32no2 = WEBRTC_SPL_UMUL_32_16(absInLevel, kLogE_1); // Q28
				176	tmpU32no2 >>= 6; // Q22
				177	}
				178	logApprox = 0;
				179	if (tmpU32no2 < tmpU32no1) {
				180	logApprox = (tmpU32no1 - tmpU32no2) >> (8 - zerosScale); // Q14
				181	}
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	182	}
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	183	numFIX = (maxGain * constMaxGain) * (1 << 6); // Q14
				184	numFIX -= (int32_t)logApprox * diffGain; // Q14
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	185
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	186	// Calculate ratio
				187	// Shift \|numFIX\| as much as possible.
				188	// Ensure we avoid wrap-around in \|den\| as well.
Per Åhgren	5b139d6	2020-03-20 15:50:14 +0100	[diff] [blame]	189	if (numFIX > (den >> 8) \|\| -numFIX > (den >> 8)) { // \|den\| is Q8.
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	190	zeros = WebRtcSpl_NormW32(numFIX);
				191	} else {
				192	zeros = WebRtcSpl_NormW32(den) + 8;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	193	}
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	194	numFIX *= 1 << zeros; // Q(14+zeros)
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	195
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	196	// Shift den so we end up in Qy1
minyue	fd634c4	2016-06-17 04:36:10 -0700	[diff] [blame]	197	tmp32no1 = WEBRTC_SPL_SHIFT_W32(den, zeros - 9); // Q(zeros - 1)
Per Åhgren	5b139d6	2020-03-20 15:50:14 +0100	[diff] [blame]	198	y32 = numFIX / tmp32no1; // in Q15
minyue	fd634c4	2016-06-17 04:36:10 -0700	[diff] [blame]	199	// This is to do rounding in Q14.
				200	y32 = y32 >= 0 ? (y32 + 1) >> 1 : -((-y32 + 1) >> 1);
				201
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	202	if (limiterEnable && (i < limiterIdx)) {
				203	tmp32 = WEBRTC_SPL_MUL_16_U16(i - 1, kLog10_2); // Q14
				204	tmp32 -= limiterLvl * (1 << 14); // Q14
				205	y32 = WebRtcSpl_DivW32W16(tmp32 + 10, 20);
				206	}
				207	if (y32 > 39000) {
				208	tmp32 = (y32 >> 1) * kLog10 + 4096; // in Q27
				209	tmp32 >>= 13; // In Q14.
				210	} else {
				211	tmp32 = y32 * kLog10 + 8192; // in Q28
				212	tmp32 >>= 14; // In Q14.
				213	}
				214	tmp32 += 16 << 14; // in Q14 (Make sure final output is in Q16)
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	215
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	216	// Calculate power
				217	if (tmp32 > 0) {
				218	intPart = (int16_t)(tmp32 >> 14);
				219	fracPart = (uint16_t)(tmp32 & 0x00003FFF); // in Q14
				220	if ((fracPart >> 13) != 0) {
				221	tmp16 = (2 << 14) - constLinApprox;
				222	tmp32no2 = (1 << 14) - fracPart;
				223	tmp32no2 *= tmp16;
				224	tmp32no2 >>= 13;
				225	tmp32no2 = (1 << 14) - tmp32no2;
				226	} else {
				227	tmp16 = constLinApprox - (1 << 14);
				228	tmp32no2 = (fracPart * tmp16) >> 13;
				229	}
				230	fracPart = (uint16_t)tmp32no2;
				231	gainTable[i] =
				232	(1 << intPart) + WEBRTC_SPL_SHIFT_W32(fracPart, intPart - 14);
				233	} else {
				234	gainTable[i] = 0;
				235	}
				236	}
				237
				238	return 0;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	239	}
				240
pbos@webrtc.org	e468bc9	2014-12-18 09:11:33 +0000	[diff] [blame]	241	int32_t WebRtcAgc_InitDigital(DigitalAgc* stt, int16_t agcMode) {
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	242	if (agcMode == kAgcModeFixedDigital) {
				243	// start at minimum to find correct gain faster
				244	stt->capacitorSlow = 0;
				245	} else {
				246	// start out with 0 dB gain
				247	stt->capacitorSlow = 134217728; // (int32_t)(0.125f * 32768.0f * 32768.0f);
				248	}
				249	stt->capacitorFast = 0;
				250	stt->gain = 65536;
				251	stt->gatePrevious = 0;
				252	stt->agcMode = agcMode;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	253
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	254	// initialize VADs
				255	WebRtcAgc_InitVad(&stt->vadNearend);
				256	WebRtcAgc_InitVad(&stt->vadFarend);
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	257
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	258	return 0;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	259	}
				260
pbos@webrtc.org	e468bc9	2014-12-18 09:11:33 +0000	[diff] [blame]	261	int32_t WebRtcAgc_AddFarendToDigital(DigitalAgc* stt,
				262	const int16_t* in_far,
Peter Kasting	dce40cf	2015-08-24 14:52:23 -0700	[diff] [blame]	263	size_t nrSamples) {
kwiberg	1e8ed4a	2016-08-26 04:33:34 -0700	[diff] [blame]	264	RTC_DCHECK(stt);
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	265	// VAD for far end
				266	WebRtcAgc_ProcessVad(&stt->vadFarend, in_far, nrSamples);
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	267
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	268	return 0;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	269	}
				270
Per Åhgren	77dc199	2019-11-23 00:14:31 +0100	[diff] [blame]	271	// Gains is an 11 element long array (one value per ms, incl start & end).
				272	int32_t WebRtcAgc_ComputeDigitalGains(DigitalAgc* stt,
				273	const int16_t* const* in_near,
				274	size_t num_bands,
				275	uint32_t FS,
				276	int16_t lowlevelSignal,
				277	int32_t gains[11]) {
				278	int32_t tmp32;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	279	int32_t env[10];
				280	int32_t max_nrg;
				281	int32_t cur_level;
Per Åhgren	77dc199	2019-11-23 00:14:31 +0100	[diff] [blame]	282	int32_t gain32;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	283	int16_t logratio;
				284	int16_t lower_thr, upper_thr;
				285	int16_t zeros = 0, zeros_fast, frac = 0;
				286	int16_t decay;
				287	int16_t gate, gain_adj;
				288	int16_t k;
Per Åhgren	77dc199	2019-11-23 00:14:31 +0100	[diff] [blame]	289	size_t n, L;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	290
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	291	// determine number of samples per ms
				292	if (FS == 8000) {
				293	L = 8;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	294	} else if (FS == 16000 \|\| FS == 32000 \|\| FS == 48000) {
				295	L = 16;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	296	} else {
				297	return -1;
				298	}
				299
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	300	// VAD for near end
Per Åhgren	77dc199	2019-11-23 00:14:31 +0100	[diff] [blame]	301	logratio = WebRtcAgc_ProcessVad(&stt->vadNearend, in_near[0], L * 10);
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	302
				303	// Account for far end VAD
				304	if (stt->vadFarend.counter > 10) {
				305	tmp32 = 3 * logratio;
				306	logratio = (int16_t)((tmp32 - stt->vadFarend.logRatio) >> 2);
				307	}
				308
				309	// Determine decay factor depending on VAD
				310	// upper_thr = 1.0f;
				311	// lower_thr = 0.25f;
				312	upper_thr = 1024; // Q10
				313	lower_thr = 0; // Q10
				314	if (logratio > upper_thr) {
				315	// decay = -2^17 / DecayTime; -> -65
				316	decay = -65;
				317	} else if (logratio < lower_thr) {
				318	decay = 0;
				319	} else {
				320	// decay = (int16_t)(((lower_thr - logratio)
				321	// * (2^27/(DecayTime*(upper_thr-lower_thr)))) >> 10);
				322	// SUBSTITUTED: 2^27/(DecayTime*(upper_thr-lower_thr)) -> 65
				323	tmp32 = (lower_thr - logratio) * 65;
				324	decay = (int16_t)(tmp32 >> 10);
				325	}
				326
				327	// adjust decay factor for long silence (detected as low standard deviation)
				328	// This is only done in the adaptive modes
				329	if (stt->agcMode != kAgcModeFixedDigital) {
				330	if (stt->vadNearend.stdLongTerm < 4000) {
				331	decay = 0;
				332	} else if (stt->vadNearend.stdLongTerm < 8096) {
				333	// decay = (int16_t)(((stt->vadNearend.stdLongTerm - 4000) * decay) >>
				334	// 12);
				335	tmp32 = (stt->vadNearend.stdLongTerm - 4000) * decay;
				336	decay = (int16_t)(tmp32 >> 12);
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	337	}
				338
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	339	if (lowlevelSignal != 0) {
				340	decay = 0;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	341	}
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	342	}
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	343	// Find max amplitude per sub frame
				344	// iterate over sub frames
				345	for (k = 0; k < 10; k++) {
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	346	// iterate over samples
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	347	max_nrg = 0;
				348	for (n = 0; n < L; n++) {
Per Åhgren	77dc199	2019-11-23 00:14:31 +0100	[diff] [blame]	349	int32_t nrg = in_near[0][k * L + n] * in_near[0][k * L + n];
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	350	if (nrg > max_nrg) {
				351	max_nrg = nrg;
				352	}
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	353	}
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	354	env[k] = max_nrg;
				355	}
				356
				357	// Calculate gain per sub frame
				358	gains[0] = stt->gain;
				359	for (k = 0; k < 10; k++) {
				360	// Fast envelope follower
				361	// decay time = -131000 / -1000 = 131 (ms)
				362	stt->capacitorFast =
				363	AGC_SCALEDIFF32(-1000, stt->capacitorFast, stt->capacitorFast);
				364	if (env[k] > stt->capacitorFast) {
				365	stt->capacitorFast = env[k];
				366	}
				367	// Slow envelope follower
				368	if (env[k] > stt->capacitorSlow) {
				369	// increase capacitorSlow
				370	stt->capacitorSlow = AGC_SCALEDIFF32(500, (env[k] - stt->capacitorSlow),
				371	stt->capacitorSlow);
				372	} else {
				373	// decrease capacitorSlow
				374	stt->capacitorSlow =
				375	AGC_SCALEDIFF32(decay, stt->capacitorSlow, stt->capacitorSlow);
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	376	}
				377
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	378	// use maximum of both capacitors as current level
				379	if (stt->capacitorFast > stt->capacitorSlow) {
				380	cur_level = stt->capacitorFast;
				381	} else {
				382	cur_level = stt->capacitorSlow;
				383	}
				384	// Translate signal level into gain, using a piecewise linear approximation
				385	// find number of leading zeros
				386	zeros = WebRtcSpl_NormU32((uint32_t)cur_level);
				387	if (cur_level == 0) {
				388	zeros = 31;
				389	}
Alex Loiko	c531af7	2017-10-24 10:41:48 +0200	[diff] [blame]	390	tmp32 = ((uint32_t)cur_level << zeros) & 0x7FFFFFFF;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	391	frac = (int16_t)(tmp32 >> 19); // Q12.
Sam Zackrisson	762289e	2018-06-26 11:21:22 +0200	[diff] [blame]	392	// Interpolate between gainTable[zeros] and gainTable[zeros-1].
Per Åhgren	5b139d6	2020-03-20 15:50:14 +0100	[diff] [blame]	393	tmp32 =
				394	((stt->gainTable[zeros - 1] - stt->gainTable[zeros]) * (int64_t)frac) >>
				395	12;
Sam Zackrisson	762289e	2018-06-26 11:21:22 +0200	[diff] [blame]	396	gains[k + 1] = stt->gainTable[zeros] + tmp32;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	397	}
				398
				399	// Gate processing (lower gain during absence of speech)
				400	zeros = (zeros << 9) - (frac >> 3);
				401	// find number of leading zeros
				402	zeros_fast = WebRtcSpl_NormU32((uint32_t)stt->capacitorFast);
				403	if (stt->capacitorFast == 0) {
				404	zeros_fast = 31;
				405	}
Alex Loiko	c531af7	2017-10-24 10:41:48 +0200	[diff] [blame]	406	tmp32 = ((uint32_t)stt->capacitorFast << zeros_fast) & 0x7FFFFFFF;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	407	zeros_fast <<= 9;
				408	zeros_fast -= (int16_t)(tmp32 >> 22);
				409
				410	gate = 1000 + zeros_fast - zeros - stt->vadNearend.stdShortTerm;
				411
				412	if (gate < 0) {
				413	stt->gatePrevious = 0;
				414	} else {
				415	tmp32 = stt->gatePrevious * 7;
				416	gate = (int16_t)((gate + tmp32) >> 3);
				417	stt->gatePrevious = gate;
				418	}
				419	// gate < 0 -> no gate
				420	// gate > 2500 -> max gate
				421	if (gate > 0) {
				422	if (gate < 2500) {
				423	gain_adj = (2500 - gate) >> 5;
				424	} else {
				425	gain_adj = 0;
				426	}
				427	for (k = 0; k < 10; k++) {
				428	if ((gains[k + 1] - stt->gainTable[0]) > 8388608) {
				429	// To prevent wraparound
				430	tmp32 = (gains[k + 1] - stt->gainTable[0]) >> 8;
				431	tmp32 *= 178 + gain_adj;
				432	} else {
				433	tmp32 = (gains[k + 1] - stt->gainTable[0]) * (178 + gain_adj);
				434	tmp32 >>= 8;
				435	}
				436	gains[k + 1] = stt->gainTable[0] + tmp32;
				437	}
				438	}
				439
				440	// Limit gain to avoid overload distortion
				441	for (k = 0; k < 10; k++) {
Sam Zackrisson	71729eb	2018-07-09 16:06:28 +0200	[diff] [blame]	442	// Find a shift of gains[k + 1] such that it can be squared without
				443	// overflow, but at least by 10 bits.
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	444	zeros = 10;
Sam Zackrisson	71729eb	2018-07-09 16:06:28 +0200	[diff] [blame]	445	if (gains[k + 1] > 47452159) {
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	446	zeros = 16 - WebRtcSpl_NormW32(gains[k + 1]);
				447	}
				448	gain32 = (gains[k + 1] >> zeros) + 1;
				449	gain32 *= gain32;
				450	// check for overflow
				451	while (AGC_MUL32((env[k] >> 12) + 1, gain32) >
				452	WEBRTC_SPL_SHIFT_W32((int32_t)32767, 2 * (1 - zeros + 10))) {
				453	// multiply by 253/256 ==> -0.1 dB
				454	if (gains[k + 1] > 8388607) {
				455	// Prevent wrap around
				456	gains[k + 1] = (gains[k + 1] / 256) * 253;
				457	} else {
				458	gains[k + 1] = (gains[k + 1] * 253) / 256;
				459	}
				460	gain32 = (gains[k + 1] >> zeros) + 1;
				461	gain32 *= gain32;
				462	}
				463	}
				464	// gain reductions should be done 1 ms earlier than gain increases
				465	for (k = 1; k < 10; k++) {
				466	if (gains[k] > gains[k + 1]) {
				467	gains[k] = gains[k + 1];
				468	}
				469	}
				470	// save start gain for next frame
				471	stt->gain = gains[10];
				472
Per Åhgren	77dc199	2019-11-23 00:14:31 +0100	[diff] [blame]	473	return 0;
				474	}
				475
// Applies per-sub-frame gains to 10 sub frames of audio.
//
// Parameters:
//   gains     - 11 gain values in Q16: sub frame k ramps linearly from
//               gains[k] to gains[k + 1].
//   num_bands - number of bands in `in_near` / `out`.
//   FS        - sample rate in Hz; 8000 gives 8 samples per sub frame,
//               16000, 32000 and 48000 give 16.
//   in_near   - input bands, 10 * L samples each.
//   out       - output bands, 10 * L samples each; a band may alias the
//               corresponding input band, in which case the copy is skipped.
//
// Output samples are saturated to the int16_t range.
// Returns 0 on success, -1 for an unsupported sample rate.
int32_t WebRtcAgc_ApplyDigitalGains(const int32_t gains[11],
                                    size_t num_bands,
                                    uint32_t FS,
                                    const int16_t* const* in_near,
                                    int16_t* const* out) {
  size_t L;    // samples per sub frame
  int16_t L2;  // log2(L); used to turn a gain difference into a per-sample step

  // determine number of samples per ms
  if (FS == 8000) {
    L = 8;
    L2 = 3;
  } else if (FS == 16000 || FS == 32000 || FS == 48000) {
    L = 16;
    L2 = 4;
  } else {
    return -1;
  }

  for (size_t i = 0; i < num_bands; ++i) {
    if (in_near[i] != out[i]) {
      // Only needed if they don't already point to the same place.
      memcpy(out[i], in_near[i], 10 * L * sizeof(in_near[i][0]));
    }
  }

  // Handle the first sub frame separately. The running gain is kept with 4
  // extra fractional bits (Q20) so the per-sample step does not lose
  // precision.
  int32_t delta = (gains[1] - gains[0]) * (1 << (4 - L2));
  int32_t gain32 = gains[0] * (1 << 4);
  for (size_t n = 0; n < L; n++) {
    for (size_t i = 0; i < num_bands; ++i) {
      // Reduced-precision product (result scaled down by 8) used only to
      // detect saturation.
      int32_t out_tmp = (int64_t)out[i][n] * ((gain32 + 127) >> 7) >> 16;
      if (out_tmp > 4095) {
        out[i][n] = (int16_t)32767;
      } else if (out_tmp < -4096) {
        out[i][n] = (int16_t)-32768;
      } else {
        int32_t tmp32 = ((int64_t)out[i][n] * (gain32 >> 4)) >> 16;
        out[i][n] = (int16_t)tmp32;
      }
    }

    gain32 += delta;
  }

  // iterate over the remaining sub frames
  for (int k = 1; k < 10; k++) {
    delta = (gains[k + 1] - gains[k]) * (1 << (4 - L2));
    gain32 = gains[k] * (1 << 4);
    // iterate over samples
    for (size_t n = 0; n < L; n++) {
      for (size_t i = 0; i < num_bands; ++i) {
        int64_t tmp64 = ((int64_t)(out[i][k * L + n])) * (gain32 >> 4);
        tmp64 = tmp64 >> 16;
        if (tmp64 > 32767) {
          out[i][k * L + n] = 32767;
        } else if (tmp64 < -32768) {
          out[i][k * L + n] = -32768;
        } else {
          out[i][k * L + n] = (int16_t)(tmp64);
        }
      }
      gain32 += delta;
    }
  }
  return 0;
}
				544
pbos@webrtc.org	e468bc9	2014-12-18 09:11:33 +0000	[diff] [blame]	545	void WebRtcAgc_InitVad(AgcVad* state) {
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	546	int16_t k;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	547
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	548	state->HPstate = 0; // state of high pass filter
				549	state->logRatio = 0; // log( P(active) / P(inactive) )
				550	// average input level (Q10)
				551	state->meanLongTerm = 15 << 10;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	552
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	553	// variance of input level (Q8)
				554	state->varianceLongTerm = 500 << 8;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	555
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	556	state->stdLongTerm = 0; // standard deviation of input level in dB
				557	// short-term average input level (Q10)
				558	state->meanShortTerm = 15 << 10;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	559
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	560	// short-term variance of input level (Q8)
				561	state->varianceShortTerm = 500 << 8;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	562
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	563	state->stdShortTerm =
				564	0; // short-term standard deviation of input level in dB
				565	state->counter = 3; // counts updates
				566	for (k = 0; k < 8; k++) {
				567	// downsampling filter
				568	state->downState[k] = 0;
				569	}
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	570	}
				571
Per Åhgren	5b139d6	2020-03-20 15:50:14 +0100	[diff] [blame]	572	int16_t WebRtcAgc_ProcessVad(AgcVad* state, // (i) VAD state
				573	const int16_t* in, // (i) Speech signal
				574	size_t nrSamples) { // (i) number of samples
Alex Loiko	c7b18fe	2017-10-27 14:57:38 +0200	[diff] [blame]	575	uint32_t nrg;
				576	int32_t out, tmp32, tmp32b;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	577	uint16_t tmpU16;
				578	int16_t k, subfr, tmp16;
				579	int16_t buf1[8];
				580	int16_t buf2[4];
				581	int16_t HPstate;
				582	int16_t zeros, dB;
Alex Loiko	e714ed6	2018-07-19 13:08:23 +0200	[diff] [blame]	583	int64_t tmp64;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	584
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	585	// process in 10 sub frames of 1 ms (to save on memory)
				586	nrg = 0;
				587	HPstate = state->HPstate;
				588	for (subfr = 0; subfr < 10; subfr++) {
				589	// downsample to 4 kHz
				590	if (nrSamples == 160) {
				591	for (k = 0; k < 8; k++) {
				592	tmp32 = (int32_t)in[2 * k] + (int32_t)in[2 * k + 1];
				593	tmp32 >>= 1;
				594	buf1[k] = (int16_t)tmp32;
				595	}
				596	in += 16;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	597
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	598	WebRtcSpl_DownsampleBy2(buf1, 8, buf2, state->downState);
				599	} else {
				600	WebRtcSpl_DownsampleBy2(in, 8, buf2, state->downState);
				601	in += 8;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	602	}
				603
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	604	// high pass filter and compute energy
				605	for (k = 0; k < 4; k++) {
				606	out = buf2[k] + HPstate;
				607	tmp32 = 600 * out;
				608	HPstate = (int16_t)((tmp32 >> 10) - buf2[k]);
Alex Loiko	7cfbf3a	2017-11-07 16:34:32 +0100	[diff] [blame]	609
				610	// Add 'out * out / 2**6' to 'nrg' in a non-overflowing
				611	// way. Guaranteed to work as long as 'out * out / 2**6' fits in
				612	// an int32_t.
				613	nrg += out * (out / (1 << 6));
				614	nrg += out * (out % (1 << 6)) / (1 << 6);
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	615	}
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	616	}
				617	state->HPstate = HPstate;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	618
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	619	// find number of leading zeros
				620	if (!(0xFFFF0000 & nrg)) {
				621	zeros = 16;
				622	} else {
				623	zeros = 0;
				624	}
				625	if (!(0xFF000000 & (nrg << zeros))) {
				626	zeros += 8;
				627	}
				628	if (!(0xF0000000 & (nrg << zeros))) {
				629	zeros += 4;
				630	}
				631	if (!(0xC0000000 & (nrg << zeros))) {
				632	zeros += 2;
				633	}
				634	if (!(0x80000000 & (nrg << zeros))) {
				635	zeros += 1;
				636	}
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	637
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	638	// energy level (range {-32..30}) (Q10)
Alex Loiko	b9f5361	2017-10-24 09:58:00 +0200	[diff] [blame]	639	dB = (15 - zeros) * (1 << 11);
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	640
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	641	// Update statistics
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	642
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	643	if (state->counter < kAvgDecayTime) {
				644	// decay time = AvgDecTime * 10 ms
				645	state->counter++;
				646	}
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	647
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	648	// update short-term estimate of mean energy level (Q10)
				649	tmp32 = state->meanShortTerm * 15 + dB;
				650	state->meanShortTerm = (int16_t)(tmp32 >> 4);
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	651
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	652	// update short-term estimate of variance in energy level (Q8)
				653	tmp32 = (dB * dB) >> 12;
				654	tmp32 += state->varianceShortTerm * 15;
				655	state->varianceShortTerm = tmp32 / 16;
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	656
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	657	// update short-term estimate of standard deviation in energy level (Q10)
				658	tmp32 = state->meanShortTerm * state->meanShortTerm;
				659	tmp32 = (state->varianceShortTerm << 12) - tmp32;
				660	state->stdShortTerm = (int16_t)WebRtcSpl_Sqrt(tmp32);
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	661
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	662	// update long-term estimate of mean energy level (Q10)
				663	tmp32 = state->meanLongTerm * state->counter + dB;
				664	state->meanLongTerm =
				665	WebRtcSpl_DivW32W16ResW16(tmp32, WebRtcSpl_AddSatW16(state->counter, 1));
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	666
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	667	// update long-term estimate of variance in energy level (Q8)
				668	tmp32 = (dB * dB) >> 12;
				669	tmp32 += state->varianceLongTerm * state->counter;
				670	state->varianceLongTerm =
				671	WebRtcSpl_DivW32W16(tmp32, WebRtcSpl_AddSatW16(state->counter, 1));
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	672
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	673	// update long-term estimate of standard deviation in energy level (Q10)
				674	tmp32 = state->meanLongTerm * state->meanLongTerm;
				675	tmp32 = (state->varianceLongTerm << 12) - tmp32;
				676	state->stdLongTerm = (int16_t)WebRtcSpl_Sqrt(tmp32);
				677
				678	// update voice activity measure (Q10)
				679	tmp16 = 3 << 12;
				680	// TODO(bjornv): (dB - state->meanLongTerm) can overflow, e.g., in
				681	// ApmTest.Process unit test. Previously the macro WEBRTC_SPL_MUL_16_16()
				682	// was used, which did an intermediate cast to (int16_t), hence losing
				683	// significant bits. This causes logRatio to max out positive, rather than
				684	// negative. This is a bug, but has very little significance.
				685	tmp32 = tmp16 * (int16_t)(dB - state->meanLongTerm);
				686	tmp32 = WebRtcSpl_DivW32W16(tmp32, state->stdLongTerm);
				687	tmpU16 = (13 << 12);
				688	tmp32b = WEBRTC_SPL_MUL_16_U16(state->logRatio, tmpU16);
Alex Loiko	e714ed6	2018-07-19 13:08:23 +0200	[diff] [blame]	689	tmp64 = tmp32;
				690	tmp64 += tmp32b >> 10;
				691	tmp64 >>= 6;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	692
				693	// limit
Alex Loiko	e714ed6	2018-07-19 13:08:23 +0200	[diff] [blame]	694	if (tmp64 > 2048) {
				695	tmp64 = 2048;
				696	} else if (tmp64 < -2048) {
				697	tmp64 = -2048;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	698	}
Alex Loiko	e714ed6	2018-07-19 13:08:23 +0200	[diff] [blame]	699	state->logRatio = (int16_t)tmp64;
minyue	cac94aa	2016-05-20 08:42:22 -0700	[diff] [blame]	700
				701	return state->logRatio; // Q10
niklase@google.com	470e71d	2011-07-07 08:21:25 +0000	[diff] [blame]	702	}
Per Åhgren	5b139d6	2020-03-20 15:50:14 +0100	[diff] [blame]	703
				704	} // namespace webrtc