From bdbceeffe8a7360dd90958ccc1c30b478a08c350 Mon Sep 17 00:00:00 2001
From: peah <peah@webrtc.org>
Date: Sun, 20 Mar 2016 09:53:32 -0700
Subject: [PATCH] Added a bitexactness test for the voice activity detector in
 the audio processing module.

BUG=webrtc:5340

Review URL: https://codereview.webrtc.org/1804373002

Cr-Commit-Position: refs/heads/master@{#12066}
---
 .../voice_detection_unittest.cc               | 123 ++++++++++++++++++
 webrtc/modules/modules.gyp                    |   1 +
 2 files changed, 124 insertions(+)
 create mode 100644 webrtc/modules/audio_processing/voice_detection_unittest.cc
diff --git a/webrtc/modules/audio_processing/voice_detection_unittest.cc b/webrtc/modules/audio_processing/voice_detection_unittest.cc
new file mode 100644
index 0000000000..791bd55500
--- /dev/null
+++ b/webrtc/modules/audio_processing/voice_detection_unittest.cc
@@ -0,0 +1,123 @@
+/*
+ *  Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
+ *
+ *  Use of this source code is governed by a BSD-style license
+ *  that can be found in the LICENSE file in the root of the source
+ *  tree. An additional intellectual property rights grant can be found
+ *  in the file PATENTS.  All contributing project authors may
+ *  be found in the AUTHORS file in the root of the source tree.
+ */
+#include <vector>
+
+#include "testing/gtest/include/gtest/gtest.h"
+#include "webrtc/base/array_view.h"
+#include "webrtc/modules/audio_processing/audio_buffer.h"
+#include "webrtc/modules/audio_processing/voice_detection_impl.h"
+#include "webrtc/modules/audio_processing/test/audio_buffer_tools.h"
+#include "webrtc/modules/audio_processing/test/bitexactness_tools.h"
+
+namespace webrtc {
+namespace {
+
+const int kNumFramesToProcess = 1000;
+
+// Process one frame of data and produce the output.
+void ProcessOneFrame(int sample_rate_hz,
+                     AudioBuffer* audio_buffer,
+                     VoiceDetectionImpl* voice_detection) {
+  if (sample_rate_hz > AudioProcessing::kSampleRate16kHz) {
+    audio_buffer->SplitIntoFrequencyBands();
+  }
+
+  voice_detection->ProcessCaptureAudio(audio_buffer);
+}
+
+// Processes a specified amount of frames, verifies the results and reports
+// any errors.
+void RunBitexactnessTest(int sample_rate_hz,
+                         size_t num_channels,
+                         int frame_size_ms_reference,
+                         bool stream_has_voice_reference,
+                         VoiceDetection::Likelihood likelihood_reference) {
+  rtc::CriticalSection crit_capture;
+  VoiceDetectionImpl voice_detection(&crit_capture);
+  voice_detection.Initialize(sample_rate_hz > 16000 ? 16000 : sample_rate_hz);
+  voice_detection.Enable(true);
+
+  int samples_per_channel = rtc::CheckedDivExact(sample_rate_hz, 100);
+  const StreamConfig capture_config(sample_rate_hz, num_channels, false);
+  AudioBuffer capture_buffer(
+      capture_config.num_frames(), capture_config.num_channels(),
+      capture_config.num_frames(), capture_config.num_channels(),
+      capture_config.num_frames());
+  test::InputAudioFile capture_file(
+      test::GetApmCaptureTestVectorFileName(sample_rate_hz));
+  std::vector<float> capture_input(samples_per_channel * num_channels);
+  for (int frame_no = 0; frame_no < kNumFramesToProcess; ++frame_no) {
+    ReadFloatSamplesFromStereoFile(samples_per_channel, num_channels,
+                                   &capture_file, capture_input);
+
+    test::CopyVectorToAudioBuffer(capture_config, capture_input,
+                                  &capture_buffer);
+
+    ProcessOneFrame(sample_rate_hz, &capture_buffer, &voice_detection);
+  }
+
+  int frame_size_ms = voice_detection.frame_size_ms();
+  bool stream_has_voice = voice_detection.stream_has_voice();
+  VoiceDetection::Likelihood likelihood = voice_detection.likelihood();
+
+  // Compare the outputs to the references.
+  EXPECT_EQ(frame_size_ms_reference, frame_size_ms);
+  EXPECT_EQ(stream_has_voice_reference, stream_has_voice);
+  EXPECT_EQ(likelihood_reference, likelihood);
+}
+
+const int kFrameSizeMsReference = 10;
+const bool kStreamHasVoiceReference = true;
+const VoiceDetection::Likelihood kLikelihoodReference =
+    VoiceDetection::kLowLikelihood;
+
+}  // namespace
+
+TEST(VoiceDetectionBitExactnessTest, Mono8kHz) {
+  RunBitexactnessTest(8000, 1, kFrameSizeMsReference, kStreamHasVoiceReference,
+                      kLikelihoodReference);
+}
+
+TEST(VoiceDetectionBitExactnessTest, Mono16kHz) {
+  RunBitexactnessTest(16000, 1, kFrameSizeMsReference, kStreamHasVoiceReference,
+                      kLikelihoodReference);
+}
+
+TEST(VoiceDetectionBitExactnessTest, Mono32kHz) {
+  RunBitexactnessTest(32000, 1, kFrameSizeMsReference, kStreamHasVoiceReference,
+                      kLikelihoodReference);
+}
+
+TEST(VoiceDetectionBitExactnessTest, Mono48kHz) {
+  RunBitexactnessTest(48000, 1, kFrameSizeMsReference, kStreamHasVoiceReference,
+                      kLikelihoodReference);
+}
+
+TEST(VoiceDetectionBitExactnessTest, Stereo8kHz) {
+  RunBitexactnessTest(8000, 2, kFrameSizeMsReference, kStreamHasVoiceReference,
+                      kLikelihoodReference);
+}
+
+TEST(VoiceDetectionBitExactnessTest, Stereo16kHz) {
+  RunBitexactnessTest(16000, 2, kFrameSizeMsReference, kStreamHasVoiceReference,
+                      kLikelihoodReference);
+}
+
+TEST(VoiceDetectionBitExactnessTest, Stereo32kHz) {
+  RunBitexactnessTest(32000, 2, kFrameSizeMsReference, kStreamHasVoiceReference,
+                      kLikelihoodReference);
+}
+
+TEST(VoiceDetectionBitExactnessTest, Stereo48kHz) {
+  RunBitexactnessTest(48000, 2, kFrameSizeMsReference, kStreamHasVoiceReference,
+                      kLikelihoodReference);
+}
+
+}  // namespace webrtc
diff --git a/webrtc/modules/modules.gyp b/webrtc/modules/modules.gyp
index 99013411e7..aea7916401 100644
--- a/webrtc/modules/modules.gyp
+++ b/webrtc/modules/modules.gyp
@@ -443,6 +443,7 @@
                 'audio_processing/high_pass_filter_bitexactness_unittest.cc',
                 'audio_processing/level_estimator_bitexactness_unittest.cc',
                 'audio_processing/noise_suppression_bitexactness_unittest.cc',
+                'audio_processing/voice_detection_unittest.cc',
                 'audio_processing/test/audio_buffer_tools.cc',
                 'audio_processing/test/audio_buffer_tools.h',
                 'audio_processing/test/audio_processing_unittest.cc',