blob: 22bc0f2263901007e2afda78aaa0c66ba44e6ceb [file] [log] [blame]
/*
 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
 *
 * Use of this source code is governed by a BSD-style license
 * that can be found in the LICENSE file in the root of the source
 * tree. An additional intellectual property rights grant can be found
 * in the file PATENTS. All contributing project authors may
 * be found in the AUTHORS file in the root of the source tree.
 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_AUDIO_PROCESSING_VAD_PITCH_BASED_VAD_H_
12#define MODULES_AUDIO_PROCESSING_VAD_PITCH_BASED_VAD_H_
pbos@webrtc.org788acd12014-12-15 09:41:24 +000013
kwibergdabf07f2016-02-17 07:59:48 -080014#include <memory>
15
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020016#include "modules/audio_processing/vad/common.h"
17#include "modules/audio_processing/vad/gmm.h"
pbos@webrtc.org788acd12014-12-15 09:41:24 +000018
19namespace webrtc {
20
aluebsecf6b812015-06-25 12:28:48 -070021class VadCircularBuffer;
pbos@webrtc.org788acd12014-12-15 09:41:24 +000022
23// Computes the probability of the input audio frame to be active given
24// the corresponding pitch-gain and lag of the frame.
25class PitchBasedVad {
26 public:
27 PitchBasedVad();
28 ~PitchBasedVad();
29
30 // Compute pitch-based voicing probability, given the features.
31 // features: a structure containing features required for computing voicing
32 // probabilities.
33 //
34 // p_combined: an array which contains the combined activity probabilities
35 // computed prior to the call of this function. The method,
36 // then, computes the voicing probabilities and combine them
37 // with the given values. The result are returned in |p|.
38 int VoicingProbability(const AudioFeatures& features, double* p_combined);
aluebsecf6b812015-06-25 12:28:48 -070039
pbos@webrtc.org788acd12014-12-15 09:41:24 +000040 private:
41 int UpdatePrior(double p);
42
43 // TODO(turajs): maybe defining this at a higher level (maybe enum) so that
44 // all the code recognize it as "no-error."
45 static const int kNoError = 0;
46
47 GmmParameters noise_gmm_;
48 GmmParameters voice_gmm_;
49
50 double p_prior_;
51
kwibergdabf07f2016-02-17 07:59:48 -080052 std::unique_ptr<VadCircularBuffer> circular_buffer_;
pbos@webrtc.org788acd12014-12-15 09:41:24 +000053};
54
55} // namespace webrtc
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020056#endif // MODULES_AUDIO_PROCESSING_VAD_PITCH_BASED_VAD_H_