pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #include "modules/audio_processing/vad/standalone_vad.h" |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 12 | |
| 13 | #include <string.h> |
| 14 | |
kwiberg | dabf07f | 2016-02-17 07:59:48 -0800 | [diff] [blame] | 15 | #include <memory> |
| 16 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 17 | #include "test/gtest.h" |
| 18 | #include "test/testsupport/fileutils.h" |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 19 | |
| 20 | namespace webrtc { |
| 21 | |
| 22 | TEST(StandaloneVadTest, Api) { |
kwiberg | dabf07f | 2016-02-17 07:59:48 -0800 | [diff] [blame] | 23 | std::unique_ptr<StandaloneVad> vad(StandaloneVad::Create()); |
aluebs | ecf6b81 | 2015-06-25 12:28:48 -0700 | [diff] [blame] | 24 | int16_t data[kLength10Ms] = {0}; |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 25 | |
| 26 | // Valid frame length (for 32 kHz rate), but not what the VAD is expecting. |
| 27 | EXPECT_EQ(-1, vad->AddAudio(data, 320)); |
| 28 | |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 29 | const size_t kMaxNumFrames = 3; |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 30 | double p[kMaxNumFrames]; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 31 | for (size_t n = 0; n < kMaxNumFrames; n++) |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 32 | EXPECT_EQ(0, vad->AddAudio(data, kLength10Ms)); |
| 33 | |
| 34 | // Pretend |p| is shorter that it should be. |
| 35 | EXPECT_EQ(-1, vad->GetActivity(p, kMaxNumFrames - 1)); |
| 36 | |
| 37 | EXPECT_EQ(0, vad->GetActivity(p, kMaxNumFrames)); |
| 38 | |
| 39 | // Ask for activity when buffer is empty. |
| 40 | EXPECT_EQ(-1, vad->GetActivity(p, kMaxNumFrames)); |
| 41 | |
| 42 | // Should reset and result in one buffer. |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 43 | for (size_t n = 0; n < kMaxNumFrames + 1; n++) |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 44 | EXPECT_EQ(0, vad->AddAudio(data, kLength10Ms)); |
| 45 | EXPECT_EQ(0, vad->GetActivity(p, 1)); |
| 46 | |
| 47 | // Wrong modes |
| 48 | EXPECT_EQ(-1, vad->set_mode(-1)); |
| 49 | EXPECT_EQ(-1, vad->set_mode(4)); |
| 50 | |
| 51 | // Valid mode. |
| 52 | const int kMode = 2; |
| 53 | EXPECT_EQ(0, vad->set_mode(kMode)); |
| 54 | EXPECT_EQ(kMode, vad->mode()); |
| 55 | } |
| 56 | |
Peter Boström | e2976c8 | 2016-01-04 22:44:05 +0100 | [diff] [blame] | 57 | #if defined(WEBRTC_IOS) |
| 58 | TEST(StandaloneVadTest, DISABLED_ActivityDetection) { |
| 59 | #else |
| 60 | TEST(StandaloneVadTest, ActivityDetection) { |
| 61 | #endif |
kwiberg | dabf07f | 2016-02-17 07:59:48 -0800 | [diff] [blame] | 62 | std::unique_ptr<StandaloneVad> vad(StandaloneVad::Create()); |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 63 | const size_t kDataLength = kLength10Ms; |
aluebs | ecf6b81 | 2015-06-25 12:28:48 -0700 | [diff] [blame] | 64 | int16_t data[kDataLength] = {0}; |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 65 | |
| 66 | FILE* pcm_file = |
| 67 | fopen(test::ResourcePath("audio_processing/agc/agc_audio", "pcm").c_str(), |
| 68 | "rb"); |
| 69 | ASSERT_TRUE(pcm_file != NULL); |
| 70 | |
| 71 | FILE* reference_file = fopen( |
| 72 | test::ResourcePath("audio_processing/agc/agc_vad", "dat").c_str(), "rb"); |
| 73 | ASSERT_TRUE(reference_file != NULL); |
| 74 | |
| 75 | // Reference activities are prepared with 0 aggressiveness. |
| 76 | ASSERT_EQ(0, vad->set_mode(0)); |
| 77 | |
| 78 | // Stand-alone VAD can operate on 1, 2 or 3 frames of length 10 ms. The |
| 79 | // reference file is created for 30 ms frame. |
| 80 | const int kNumVadFramesToProcess = 3; |
| 81 | int num_frames = 0; |
| 82 | while (fread(data, sizeof(int16_t), kDataLength, pcm_file) == kDataLength) { |
| 83 | vad->AddAudio(data, kDataLength); |
| 84 | num_frames++; |
| 85 | if (num_frames == kNumVadFramesToProcess) { |
| 86 | num_frames = 0; |
| 87 | int referece_activity; |
| 88 | double p[kNumVadFramesToProcess]; |
| 89 | EXPECT_EQ(1u, fread(&referece_activity, sizeof(referece_activity), 1, |
| 90 | reference_file)); |
| 91 | int activity = vad->GetActivity(p, kNumVadFramesToProcess); |
| 92 | EXPECT_EQ(referece_activity, activity); |
| 93 | if (activity != 0) { |
| 94 | // When active, probabilities are set to 0.5. |
| 95 | for (int n = 0; n < kNumVadFramesToProcess; n++) |
| 96 | EXPECT_EQ(0.5, p[n]); |
| 97 | } else { |
| 98 | // When inactive, probabilities are set to 0.01. |
| 99 | for (int n = 0; n < kNumVadFramesToProcess; n++) |
| 100 | EXPECT_EQ(0.01, p[n]); |
| 101 | } |
| 102 | } |
| 103 | } |
| 104 | fclose(reference_file); |
| 105 | fclose(pcm_file); |
| 106 | } |
aluebs | ecf6b81 | 2015-06-25 12:28:48 -0700 | [diff] [blame] | 107 | } // namespace webrtc |