1 /* 2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. 3 * 4 * Use of this source code is governed by a BSD-style license 5 * that can be found in the LICENSE file in the root of the source 6 * tree. An additional intellectual property rights grant can be found 7 * in the file PATENTS. All contributing project authors may 8 * be found in the AUTHORS file in the root of the source tree. 9 */ 10 11 #include "webrtc/modules/audio_processing/vad/standalone_vad.h" 12 13 #include <string.h> 14 15 #include "testing/gtest/include/gtest/gtest.h" 16 #include "webrtc/base/scoped_ptr.h" 17 #include "webrtc/modules/include/module_common_types.h" 18 #include "webrtc/test/testsupport/fileutils.h" 19 20 namespace webrtc { 21 22 TEST(StandaloneVadTest, Api) { 23 rtc::scoped_ptr<StandaloneVad> vad(StandaloneVad::Create()); 24 int16_t data[kLength10Ms] = {0}; 25 26 // Valid frame length (for 32 kHz rate), but not what the VAD is expecting. 27 EXPECT_EQ(-1, vad->AddAudio(data, 320)); 28 29 const size_t kMaxNumFrames = 3; 30 double p[kMaxNumFrames]; 31 for (size_t n = 0; n < kMaxNumFrames; n++) 32 EXPECT_EQ(0, vad->AddAudio(data, kLength10Ms)); 33 34 // Pretend |p| is shorter that it should be. 35 EXPECT_EQ(-1, vad->GetActivity(p, kMaxNumFrames - 1)); 36 37 EXPECT_EQ(0, vad->GetActivity(p, kMaxNumFrames)); 38 39 // Ask for activity when buffer is empty. 40 EXPECT_EQ(-1, vad->GetActivity(p, kMaxNumFrames)); 41 42 // Should reset and result in one buffer. 43 for (size_t n = 0; n < kMaxNumFrames + 1; n++) 44 EXPECT_EQ(0, vad->AddAudio(data, kLength10Ms)); 45 EXPECT_EQ(0, vad->GetActivity(p, 1)); 46 47 // Wrong modes 48 EXPECT_EQ(-1, vad->set_mode(-1)); 49 EXPECT_EQ(-1, vad->set_mode(4)); 50 51 // Valid mode. 52 const int kMode = 2; 53 EXPECT_EQ(0, vad->set_mode(kMode)); 54 EXPECT_EQ(kMode, vad->mode()); 55 } 56 57 #if defined(WEBRTC_IOS) 58 TEST(StandaloneVadTest, DISABLED_ActivityDetection) { 59 #else 60 TEST(StandaloneVadTest, ActivityDetection) { 61 #endif 62 rtc::scoped_ptr<StandaloneVad> vad(StandaloneVad::Create()); 63 const size_t kDataLength = kLength10Ms; 64 int16_t data[kDataLength] = {0}; 65 66 FILE* pcm_file = 67 fopen(test::ResourcePath("audio_processing/agc/agc_audio", "pcm").c_str(), 68 "rb"); 69 ASSERT_TRUE(pcm_file != NULL); 70 71 FILE* reference_file = fopen( 72 test::ResourcePath("audio_processing/agc/agc_vad", "dat").c_str(), "rb"); 73 ASSERT_TRUE(reference_file != NULL); 74 75 // Reference activities are prepared with 0 aggressiveness. 76 ASSERT_EQ(0, vad->set_mode(0)); 77 78 // Stand-alone VAD can operate on 1, 2 or 3 frames of length 10 ms. The 79 // reference file is created for 30 ms frame. 80 const int kNumVadFramesToProcess = 3; 81 int num_frames = 0; 82 while (fread(data, sizeof(int16_t), kDataLength, pcm_file) == kDataLength) { 83 vad->AddAudio(data, kDataLength); 84 num_frames++; 85 if (num_frames == kNumVadFramesToProcess) { 86 num_frames = 0; 87 int referece_activity; 88 double p[kNumVadFramesToProcess]; 89 EXPECT_EQ(1u, fread(&referece_activity, sizeof(referece_activity), 1, 90 reference_file)); 91 int activity = vad->GetActivity(p, kNumVadFramesToProcess); 92 EXPECT_EQ(referece_activity, activity); 93 if (activity != 0) { 94 // When active, probabilities are set to 0.5. 95 for (int n = 0; n < kNumVadFramesToProcess; n++) 96 EXPECT_EQ(0.5, p[n]); 97 } else { 98 // When inactive, probabilities are set to 0.01. 99 for (int n = 0; n < kNumVadFramesToProcess; n++) 100 EXPECT_EQ(0.01, p[n]); 101 } 102 } 103 } 104 fclose(reference_file); 105 fclose(pcm_file); 106 } 107 } // namespace webrtc 108