blob: 4d327652c680172752b9f67310024b156e050355 [file] [log] [blame]
pbos@webrtc.org788acd12014-12-15 09:41:24 +00001/*
2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_AUDIO_PROCESSING_VAD_PITCH_BASED_VAD_H_
12#define MODULES_AUDIO_PROCESSING_VAD_PITCH_BASED_VAD_H_
pbos@webrtc.org788acd12014-12-15 09:41:24 +000013
kwibergdabf07f2016-02-17 07:59:48 -080014#include <memory>
15
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020016#include "modules/audio_processing/vad/common.h"
17#include "modules/audio_processing/vad/gmm.h"
pbos@webrtc.org788acd12014-12-15 09:41:24 +000018
19namespace webrtc {
20
// Forward declarations; this header does not need the full definitions.
// VadCircularBuffer is only held through a std::unique_ptr below, and
// AudioFrame is not referenced by any declaration in this header.
class AudioFrame;
class VadCircularBuffer;
pbos@webrtc.org788acd12014-12-15 09:41:24 +000023
24// Computes the probability of the input audio frame to be active given
25// the corresponding pitch-gain and lag of the frame.
26class PitchBasedVad {
27 public:
28 PitchBasedVad();
29 ~PitchBasedVad();
30
31 // Compute pitch-based voicing probability, given the features.
32 // features: a structure containing features required for computing voicing
33 // probabilities.
34 //
35 // p_combined: an array which contains the combined activity probabilities
36 // computed prior to the call of this function. The method,
37 // then, computes the voicing probabilities and combine them
38 // with the given values. The result are returned in |p|.
39 int VoicingProbability(const AudioFeatures& features, double* p_combined);
aluebsecf6b812015-06-25 12:28:48 -070040
pbos@webrtc.org788acd12014-12-15 09:41:24 +000041 private:
42 int UpdatePrior(double p);
43
44 // TODO(turajs): maybe defining this at a higher level (maybe enum) so that
45 // all the code recognize it as "no-error."
46 static const int kNoError = 0;
47
48 GmmParameters noise_gmm_;
49 GmmParameters voice_gmm_;
50
51 double p_prior_;
52
kwibergdabf07f2016-02-17 07:59:48 -080053 std::unique_ptr<VadCircularBuffer> circular_buffer_;
pbos@webrtc.org788acd12014-12-15 09:41:24 +000054};
55
56} // namespace webrtc
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020057#endif // MODULES_AUDIO_PROCESSING_VAD_PITCH_BASED_VAD_H_