blob: edc74945db0ffa01bd35ca222394249c23e8eb58 [file] [log] [blame]
niklase@google.com470e71d2011-07-07 08:21:25 +00001/*
bjornv@webrtc.org152c34c2012-01-23 12:36:46 +00002 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
niklase@google.com470e71d2011-07-07 08:21:25 +00003 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
11
12/*
13 * This header file includes the VAD API calls. Specific function calls are given below.
14 */
15
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000016#ifndef WEBRTC_COMMON_AUDIO_VAD_INCLUDE_WEBRTC_VAD_H_ // NOLINT
bjornv@webrtc.org0c6f9312012-01-30 09:39:08 +000017#define WEBRTC_COMMON_AUDIO_VAD_INCLUDE_WEBRTC_VAD_H_
niklase@google.com470e71d2011-07-07 08:21:25 +000018
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000019#include "typedefs.h" // NOLINT
niklase@google.com470e71d2011-07-07 08:21:25 +000020
21typedef struct WebRtcVadInst VadInst;  // Handle type; struct WebRtcVadInst is only forward-declared in this header.
22
23#ifdef __cplusplus
bjornv@webrtc.orged700db2012-03-12 12:17:26 +000024extern "C" {
niklase@google.com470e71d2011-07-07 08:21:25 +000025#endif
26
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000027// Creates an instance of the VAD structure.
28//
29// - handle [o] : Receives a pointer to the VAD instance that is created.
30//
31// returns : 0 - (OK), -1 - (Error)
32int WebRtcVad_Create(VadInst** handle);
niklase@google.com470e71d2011-07-07 08:21:25 +000033
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000034// Frees the dynamic memory of the specified VAD instance.
35//
36// - handle [i] : Pointer to the VAD instance that should be freed.
37//
38// returns : 0 - (OK), -1 - (NULL pointer passed in)
39int WebRtcVad_Free(VadInst* handle);
niklase@google.com470e71d2011-07-07 08:21:25 +000040
bjornv@webrtc.orged700db2012-03-12 12:17:26 +000041// Initializes a VAD instance.
42//
43// - handle [i/o] : Instance that should be initialized.
44//
45// returns : 0 - (OK),
bjornv@webrtc.org78f0cdc2012-03-27 11:06:29 +000046// -1 - (NULL pointer, or the default mode could not be set).
bjornv@webrtc.orged700db2012-03-12 12:17:26 +000047int WebRtcVad_Init(VadInst* handle);
niklase@google.com470e71d2011-07-07 08:21:25 +000048
bjornv@webrtc.org78f0cdc2012-03-27 11:06:29 +000049// Sets the VAD operating mode. A more aggressive (higher mode) VAD is more
50// restrictive in reporting speech. In other words, the probability that a
51// frame really is speech when the VAD returns 1 increases with the mode. As a
52// consequence, the missed detection rate also goes up.
53//
54// - handle [i/o] : VAD instance.
55// - mode [i] : Aggressiveness mode (0, 1, 2, or 3).
56//
57// returns : 0 - (OK),
58// -1 - (NULL pointer, mode could not be set, or the VAD instance
59// has not been initialized).
60int WebRtcVad_set_mode(VadInst* handle, int mode);
niklase@google.com470e71d2011-07-07 08:21:25 +000061
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000062// Calculates a VAD decision for the |audio_frame|. For valid sampling rates
63// and frame lengths, see the description of WebRtcVad_ValidRateAndFrameLength().
64//
65// - handle [i/o] : VAD Instance. Needs to be initialized by
66// WebRtcVad_Init() before call.
67// - fs [i] : Sampling frequency (Hz): 8000, 16000, or 32000.
68// - audio_frame [i] : Audio frame buffer (input only, although not declared const).
69// - frame_length [i] : Length of audio frame buffer in number of samples.
70//
71// returns : 1 - (Active Voice),
72// 0 - (Non-active Voice),
73// -1 - (Error)
bjornv@webrtc.orgb38fca12012-06-19 11:03:32 +000074int WebRtcVad_Process(VadInst* handle, int fs, int16_t* audio_frame,
75 int frame_length);
niklase@google.com470e71d2011-07-07 08:21:25 +000076
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000077// Checks whether |rate| and |frame_length| form a valid combination. Supported
78// are 10, 20 and 30 ms frames at the rates 8000, 16000 and 32000 Hz.
79//
80// - rate [i] : Sampling frequency (Hz).
81// - frame_length [i] : Speech frame buffer length in number of samples.
82//
83// returns : 0 - (valid combination), -1 - (invalid combination)
84int WebRtcVad_ValidRateAndFrameLength(int rate, int frame_length);
85
niklase@google.com470e71d2011-07-07 08:21:25 +000086#ifdef __cplusplus
87}
88#endif
89
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000090#endif // WEBRTC_COMMON_AUDIO_VAD_INCLUDE_WEBRTC_VAD_H_ // NOLINT