blob: 4191c03e0faf32f6dd2f5c019f6e3b052c8ea034 [file] [log] [blame]
niklase@google.com470e71d2011-07-07 08:21:25 +00001/*
bjornv@webrtc.orga496b032012-03-20 12:53:06 +00002 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
niklase@google.com470e71d2011-07-07 08:21:25 +00003 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
pbos@webrtc.orgaa30bb72013-05-27 09:49:58 +000011#include "webrtc/common_audio/vad/vad_sp.h"
bjornv@webrtc.org2111d3b2011-10-14 12:58:34 +000012
ehmaldonadoeaaae9e2017-07-07 03:09:51 -070013#include "webrtc/rtc_base/checks.h"
pbos@webrtc.orgaa30bb72013-05-27 09:49:58 +000014#include "webrtc/common_audio/signal_processing/include/signal_processing_library.h"
15#include "webrtc/common_audio/vad/vad_core.h"
16#include "webrtc/typedefs.h"
bjornv@webrtc.org2111d3b2011-10-14 12:58:34 +000017
// Coefficients of the two all-pass branches used by the downsampling filter,
// stored in Q13 (i.e. scaled by 8192).
static const int16_t kAllPassCoefsQ13[2] = {
  5243,  // Upper branch: 5243 / 8192 ~= 0.64.
  1392   // Lower branch: 1392 / 8192 ~= 0.17.
};

// Smoothing factors applied to the running minimum estimate, stored in Q15
// (i.e. scaled by 32768).
static const int16_t kSmoothingDown = 6553;  // ~= 0.2 in Q15.
static const int16_t kSmoothingUp = 32439;  // ~= 0.99 in Q15.
niklase@google.com470e71d2011-07-07 08:21:25 +000023
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000024// TODO(bjornv): Move this function to vad_filterbank.c.
25// Downsampling filter based on splitting filter and allpass functions.
andrew@webrtc.org65f93382014-04-30 16:44:13 +000026void WebRtcVad_Downsampling(const int16_t* signal_in,
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000027 int16_t* signal_out,
28 int32_t* filter_state,
Peter Kastingdce40cf2015-08-24 14:52:23 -070029 size_t in_length) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000030 int16_t tmp16_1 = 0, tmp16_2 = 0;
31 int32_t tmp32_1 = filter_state[0];
32 int32_t tmp32_2 = filter_state[1];
Peter Kastingdce40cf2015-08-24 14:52:23 -070033 size_t n = 0;
34 // Downsampling by 2 gives half length.
35 size_t half_length = (in_length >> 1);
niklase@google.com470e71d2011-07-07 08:21:25 +000036
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000037 // Filter coefficients in Q13, filter state in Q0.
38 for (n = 0; n < half_length; n++) {
39 // All-pass filtering upper branch.
40 tmp16_1 = (int16_t) ((tmp32_1 >> 1) +
Bjorn Volcker3fbf99c2015-03-25 14:37:24 +010041 ((kAllPassCoefsQ13[0] * *signal_in) >> 14));
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000042 *signal_out = tmp16_1;
Bjorn Volcker3fbf99c2015-03-25 14:37:24 +010043 tmp32_1 = (int32_t)(*signal_in++) - ((kAllPassCoefsQ13[0] * tmp16_1) >> 12);
niklase@google.com470e71d2011-07-07 08:21:25 +000044
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000045 // All-pass filtering lower branch.
46 tmp16_2 = (int16_t) ((tmp32_2 >> 1) +
Bjorn Volcker3fbf99c2015-03-25 14:37:24 +010047 ((kAllPassCoefsQ13[1] * *signal_in) >> 14));
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000048 *signal_out++ += tmp16_2;
Bjorn Volcker3fbf99c2015-03-25 14:37:24 +010049 tmp32_2 = (int32_t)(*signal_in++) - ((kAllPassCoefsQ13[1] * tmp16_2) >> 12);
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000050 }
51 // Store the filter states.
52 filter_state[0] = tmp32_1;
53 filter_state[1] = tmp32_2;
niklase@google.com470e71d2011-07-07 08:21:25 +000054}
55
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000056// Inserts |feature_value| into |low_value_vector|, if it is one of the 16
57// smallest values the last 100 frames. Then calculates and returns the median
58// of the five smallest values.
59int16_t WebRtcVad_FindMinimum(VadInstT* self,
60 int16_t feature_value,
61 int channel) {
62 int i = 0, j = 0;
63 int position = -1;
64 // Offset to beginning of the 16 minimum values in memory.
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +000065 const int offset = (channel << 4);
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000066 int16_t current_median = 1600;
67 int16_t alpha = 0;
68 int32_t tmp32 = 0;
69 // Pointer to memory for the 16 minimum values and the age of each value of
70 // the |channel|.
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +000071 int16_t* age = &self->index_vector[offset];
72 int16_t* smallest_values = &self->low_value_vector[offset];
niklase@google.com470e71d2011-07-07 08:21:25 +000073
kwiberg1e8ed4a2016-08-26 04:33:34 -070074 RTC_DCHECK_LT(channel, kNumChannels);
niklase@google.com470e71d2011-07-07 08:21:25 +000075
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +000076 // Each value in |smallest_values| is getting 1 loop older. Update |age|, and
77 // remove old values.
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000078 for (i = 0; i < 16; i++) {
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +000079 if (age[i] != 100) {
80 age[i]++;
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000081 } else {
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +000082 // Too old value. Remove from memory and shift larger values downwards.
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000083 for (j = i; j < 16; j++) {
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +000084 smallest_values[j] = smallest_values[j + 1];
85 age[j] = age[j + 1];
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000086 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +000087 age[15] = 101;
88 smallest_values[15] = 10000;
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000089 }
90 }
niklase@google.com470e71d2011-07-07 08:21:25 +000091
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000092 // Check if |feature_value| is smaller than any of the values in
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +000093 // |smallest_values|. If so, find the |position| where to insert the new value
94 // (|feature_value|).
95 if (feature_value < smallest_values[7]) {
96 if (feature_value < smallest_values[3]) {
97 if (feature_value < smallest_values[1]) {
98 if (feature_value < smallest_values[0]) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +000099 position = 0;
100 } else {
101 position = 1;
niklase@google.com470e71d2011-07-07 08:21:25 +0000102 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000103 } else if (feature_value < smallest_values[2]) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000104 position = 2;
105 } else {
106 position = 3;
107 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000108 } else if (feature_value < smallest_values[5]) {
109 if (feature_value < smallest_values[4]) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000110 position = 4;
111 } else {
112 position = 5;
113 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000114 } else if (feature_value < smallest_values[6]) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000115 position = 6;
116 } else {
117 position = 7;
niklase@google.com470e71d2011-07-07 08:21:25 +0000118 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000119 } else if (feature_value < smallest_values[15]) {
120 if (feature_value < smallest_values[11]) {
121 if (feature_value < smallest_values[9]) {
122 if (feature_value < smallest_values[8]) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000123 position = 8;
124 } else {
125 position = 9;
niklase@google.com470e71d2011-07-07 08:21:25 +0000126 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000127 } else if (feature_value < smallest_values[10]) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000128 position = 10;
129 } else {
130 position = 11;
131 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000132 } else if (feature_value < smallest_values[13]) {
133 if (feature_value < smallest_values[12]) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000134 position = 12;
135 } else {
136 position = 13;
137 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000138 } else if (feature_value < smallest_values[14]) {
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000139 position = 14;
140 } else {
141 position = 15;
niklase@google.com470e71d2011-07-07 08:21:25 +0000142 }
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000143 }
niklase@google.com470e71d2011-07-07 08:21:25 +0000144
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000145 // If we have detected a new small value, insert it at the correct position
146 // and shift larger values up.
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000147 if (position > -1) {
148 for (i = 15; i > position; i--) {
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000149 smallest_values[i] = smallest_values[i - 1];
150 age[i] = age[i - 1];
niklase@google.com470e71d2011-07-07 08:21:25 +0000151 }
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000152 smallest_values[position] = feature_value;
153 age[position] = 1;
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000154 }
niklase@google.com470e71d2011-07-07 08:21:25 +0000155
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000156 // Get |current_median|.
157 if (self->frame_counter > 2) {
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000158 current_median = smallest_values[2];
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000159 } else if (self->frame_counter > 0) {
bjornv@webrtc.orgeec739f2012-06-11 07:57:57 +0000160 current_median = smallest_values[0];
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000161 }
162
163 // Smooth the median value.
164 if (self->frame_counter > 0) {
165 if (current_median < self->mean_value[channel]) {
bjornv@webrtc.orga496b032012-03-20 12:53:06 +0000166 alpha = kSmoothingDown; // 0.2 in Q15.
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000167 } else {
bjornv@webrtc.orga496b032012-03-20 12:53:06 +0000168 alpha = kSmoothingUp; // 0.99 in Q15.
niklase@google.com470e71d2011-07-07 08:21:25 +0000169 }
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000170 }
bjornv@webrtc.orgd25c0342015-01-26 15:32:47 +0000171 tmp32 = (alpha + 1) * self->mean_value[channel];
172 tmp32 += (WEBRTC_SPL_WORD16_MAX - alpha) * current_median;
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000173 tmp32 += 16384;
174 self->mean_value[channel] = (int16_t) (tmp32 >> 15);
niklase@google.com470e71d2011-07-07 08:21:25 +0000175
bjornv@webrtc.org226c5a12012-01-04 09:15:12 +0000176 return self->mean_value[channel];
niklase@google.com470e71d2011-07-07 08:21:25 +0000177}