blob: 3b31ef51f7790b786f4d792eaabff0ec7b851214 [file] [log] [blame]
/*
 *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10
pbos@webrtc.orgaa30bb72013-05-27 09:49:58 +000011#include "webrtc/common_audio/vad/include/webrtc_vad.h"
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000012
niklase@google.com470e71d2011-07-07 08:21:25 +000013#include <stdlib.h>
14#include <string.h>
15
pbos@webrtc.orgaa30bb72013-05-27 09:49:58 +000016#include "webrtc/common_audio/signal_processing/include/signal_processing_library.h"
17#include "webrtc/common_audio/vad/vad_core.h"
18#include "webrtc/typedefs.h"
niklase@google.com470e71d2011-07-07 08:21:25 +000019
// Value that |init_flag| is compared against by WebRtcVad_set_mode() and
// WebRtcVad_Process(); any other value makes those calls fail with -1.
static const int kInitCheck = 42;
// Sampling rates, in Hz, accepted by WebRtcVad_ValidRateAndFrameLength().
static const int kValidRates[] = { 8000, 16000, 32000, 48000 };
// Number of entries in |kValidRates|.
static const size_t kRatesSize = sizeof(kValidRates) / sizeof(*kValidRates);
// Longest accepted frame duration in milliseconds; frames are validated in
// 10 ms steps up to and including this value.
static const int kMaxFrameLengthMs = 30;
niklase@google.com470e71d2011-07-07 08:21:25 +000024
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000025int WebRtcVad_Create(VadInst** handle) {
26 VadInstT* self = NULL;
niklase@google.com470e71d2011-07-07 08:21:25 +000027
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000028 if (handle == NULL) {
29 return -1;
30 }
niklase@google.com470e71d2011-07-07 08:21:25 +000031
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000032 *handle = NULL;
33 self = (VadInstT*) malloc(sizeof(VadInstT));
34 *handle = (VadInst*) self;
niklase@google.com470e71d2011-07-07 08:21:25 +000035
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000036 if (self == NULL) {
37 return -1;
38 }
niklase@google.com470e71d2011-07-07 08:21:25 +000039
kma@webrtc.orgac4d70d2012-10-05 00:19:01 +000040 WebRtcSpl_Init();
41
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000042 self->init_flag = 0;
niklase@google.com470e71d2011-07-07 08:21:25 +000043
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000044 return 0;
niklase@google.com470e71d2011-07-07 08:21:25 +000045}
46
bjornv@webrtc.org2a796722014-04-22 04:45:35 +000047void WebRtcVad_Free(VadInst* handle) {
bjornv@webrtc.org26e8a582012-01-31 14:42:50 +000048 free(handle);
niklase@google.com470e71d2011-07-07 08:21:25 +000049}
50
bjornv@webrtc.orged700db2012-03-12 12:17:26 +000051// TODO(bjornv): Move WebRtcVad_InitCore() code here.
bjornv@webrtc.org2a4dcd72012-01-25 12:18:12 +000052int WebRtcVad_Init(VadInst* handle) {
53 // Initialize the core VAD component.
54 return WebRtcVad_InitCore((VadInstT*) handle);
niklase@google.com470e71d2011-07-07 08:21:25 +000055}
56
bjornv@webrtc.org78f0cdc2012-03-27 11:06:29 +000057// TODO(bjornv): Move WebRtcVad_set_mode_core() code here.
58int WebRtcVad_set_mode(VadInst* handle, int mode) {
59 VadInstT* self = (VadInstT*) handle;
niklase@google.com470e71d2011-07-07 08:21:25 +000060
bjornv@webrtc.org78f0cdc2012-03-27 11:06:29 +000061 if (handle == NULL) {
62 return -1;
63 }
64 if (self->init_flag != kInitCheck) {
65 return -1;
66 }
niklase@google.com470e71d2011-07-07 08:21:25 +000067
bjornv@webrtc.org78f0cdc2012-03-27 11:06:29 +000068 return WebRtcVad_set_mode_core(self, mode);
niklase@google.com470e71d2011-07-07 08:21:25 +000069}
70
bjornv@webrtc.orgb38fca12012-06-19 11:03:32 +000071int WebRtcVad_Process(VadInst* handle, int fs, int16_t* audio_frame,
72 int frame_length) {
73 int vad = -1;
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000074 VadInstT* self = (VadInstT*) handle;
niklase@google.com470e71d2011-07-07 08:21:25 +000075
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000076 if (handle == NULL) {
77 return -1;
78 }
niklase@google.com470e71d2011-07-07 08:21:25 +000079
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000080 if (self->init_flag != kInitCheck) {
81 return -1;
82 }
83 if (audio_frame == NULL) {
84 return -1;
85 }
86 if (WebRtcVad_ValidRateAndFrameLength(fs, frame_length) != 0) {
87 return -1;
88 }
niklase@google.com470e71d2011-07-07 08:21:25 +000089
tina.legrand@webrtc.orgef433572012-10-15 17:46:19 +000090 if (fs == 48000) {
91 vad = WebRtcVad_CalcVad48khz(self, audio_frame, frame_length);
92 } else if (fs == 32000) {
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +000093 vad = WebRtcVad_CalcVad32khz(self, audio_frame, frame_length);
94 } else if (fs == 16000) {
95 vad = WebRtcVad_CalcVad16khz(self, audio_frame, frame_length);
96 } else if (fs == 8000) {
97 vad = WebRtcVad_CalcVad8khz(self, audio_frame, frame_length);
98 }
niklase@google.com470e71d2011-07-07 08:21:25 +000099
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +0000100 if (vad > 0) {
101 vad = 1;
102 }
103 return vad;
104}
105
106int WebRtcVad_ValidRateAndFrameLength(int rate, int frame_length) {
107 int return_value = -1;
108 size_t i;
109 int valid_length_ms;
110 int valid_length;
111
112 // We only allow 10, 20 or 30 ms frames. Loop through valid frame rates and
113 // see if we have a matching pair.
114 for (i = 0; i < kRatesSize; i++) {
115 if (kValidRates[i] == rate) {
116 for (valid_length_ms = 10; valid_length_ms <= kMaxFrameLengthMs;
117 valid_length_ms += 10) {
118 valid_length = (kValidRates[i] / 1000 * valid_length_ms);
119 if (frame_length == valid_length) {
120 return_value = 0;
121 break;
niklase@google.com470e71d2011-07-07 08:21:25 +0000122 }
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +0000123 }
124 break;
niklase@google.com470e71d2011-07-07 08:21:25 +0000125 }
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +0000126 }
niklase@google.com470e71d2011-07-07 08:21:25 +0000127
bjornv@webrtc.orgb1c32762012-06-12 08:19:24 +0000128 return return_value;
niklase@google.com470e71d2011-07-07 08:21:25 +0000129}