1 files changed, 202 insertions, 0 deletions
diff --git a/src/modules/audio_processing/main/source/voice_detection_impl.cc b/src/modules/audio_processing/main/source/voice_detection_impl.cc
new file mode 100644
index 0000000000..3eb446e911
--- /dev/null
+++ b/src/modules/audio_processing/main/source/voice_detection_impl.cc
@@ -0,0 +1,202 @@
+/*
+ *  Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
+ *
+ *  Use of this source code is governed by a BSD-style license
+ *  that can be found in the LICENSE file in the root of the source
+ *  tree. An additional intellectual property rights grant can be found
+ *  in the file PATENTS.  All contributing project authors may
+ *  be found in the AUTHORS file in the root of the source tree.
+ */
+
+#include "voice_detection_impl.h"
+
+#include <cassert>
+
+#include "critical_section_wrapper.h"
+#include "webrtc_vad.h"
+
+#include "audio_processing_impl.h"
+#include "audio_buffer.h"
+
+namespace webrtc {
+
+typedef VadInst Handle;
+
+namespace {
+WebRtc_Word16 MapSetting(VoiceDetection::Likelihood likelihood) {
+  switch (likelihood) {
+    case VoiceDetection::kVeryLowLikelihood:
+      return 3;
+      break;
+    case VoiceDetection::kLowLikelihood:
+      return 2;
+      break;
+    case VoiceDetection::kModerateLikelihood:
+      return 1;
+      break;
+    case VoiceDetection::kHighLikelihood:
+      return 0;
+      break;
+    default:
+      return -1;
+  }
+}
+}  // namespace
+
+
+VoiceDetectionImpl::VoiceDetectionImpl(const AudioProcessingImpl* apm)
+  : ProcessingComponent(apm),
+    apm_(apm),
+    stream_has_voice_(false),
+    using_external_vad_(false),
+    likelihood_(kLowLikelihood),
+    frame_size_ms_(10),
+    frame_size_samples_(0) {}
+
+VoiceDetectionImpl::~VoiceDetectionImpl() {}
+
+int VoiceDetectionImpl::ProcessCaptureAudio(AudioBuffer* audio) {
+  if (!is_component_enabled()) {
+    return apm_->kNoError;
+  }
+
+  if (using_external_vad_) {
+    using_external_vad_ = false;
+    return apm_->kNoError;
+  }
+  assert(audio->samples_per_split_channel() <= 160);
+
+  WebRtc_Word16* mixed_data = audio->low_pass_split_data(0);
+  if (audio->num_channels() > 1) {
+    audio->CopyAndMixLowPass(1);
+    mixed_data = audio->mixed_low_pass_data(0);
+  }
+
+  // TODO(ajm): concatenate data in frame buffer here.
+
+  int vad_ret_val;
+  vad_ret_val = WebRtcVad_Process(static_cast<Handle*>(handle(0)),
+                      apm_->split_sample_rate_hz(),
+                      mixed_data,
+                      frame_size_samples_);
+
+  if (vad_ret_val == 0) {
+    stream_has_voice_ = false;
+  } else if (vad_ret_val == 1) {
+    stream_has_voice_ = true;
+  } else {
+    return apm_->kUnspecifiedError;
+  }
+
+  return apm_->kNoError;
+}
+
+int VoiceDetectionImpl::Enable(bool enable) {
+  CriticalSectionScoped crit_scoped(*apm_->crit());
+  return EnableComponent(enable);
+}
+
+bool VoiceDetectionImpl::is_enabled() const {
+  return is_component_enabled();
+}
+
+int VoiceDetectionImpl::set_stream_has_voice(bool has_voice) {
+  using_external_vad_ = true;
+  stream_has_voice_ = has_voice;
+  return apm_->kNoError;
+}
+
+bool VoiceDetectionImpl::stream_has_voice() const {
+  // TODO(ajm): enable this assertion?
+  //assert(using_external_vad_ || is_component_enabled());
+  return stream_has_voice_;
+}
+
+int VoiceDetectionImpl::set_likelihood(VoiceDetection::Likelihood likelihood) {
+  CriticalSectionScoped crit_scoped(*apm_->crit());
+  if (MapSetting(likelihood) == -1) {
+    return apm_->kBadParameterError;
+  }
+
+  likelihood_ = likelihood;
+  return Configure();
+}
+
+VoiceDetection::Likelihood VoiceDetectionImpl::likelihood() const {
+  return likelihood_;
+}
+
+int VoiceDetectionImpl::set_frame_size_ms(int size) {
+  CriticalSectionScoped crit_scoped(*apm_->crit());
+  assert(size == 10); // TODO(ajm): remove when supported.
+  if (size != 10 &&
+      size != 20 &&
+      size != 30) {
+    return apm_->kBadParameterError;
+  }
+
+  frame_size_ms_ = size;
+
+  return Initialize();
+}
+
+int VoiceDetectionImpl::frame_size_ms() const {
+  return frame_size_ms_;
+}
+
+int VoiceDetectionImpl::Initialize() {
+  int err = ProcessingComponent::Initialize();
+  if (err != apm_->kNoError || !is_component_enabled()) {
+    return err;
+  }
+
+  using_external_vad_ = false;
+  frame_size_samples_ = frame_size_ms_ * (apm_->split_sample_rate_hz() / 1000);
+  // TODO(ajm): intialize frame buffer here.
+
+  return apm_->kNoError;
+}
+
+int VoiceDetectionImpl::get_version(char* version,
+                                    int version_len_bytes) const {
+  if (WebRtcVad_get_version(version, version_len_bytes) != 0) {
+    return apm_->kBadParameterError;
+  }
+
+  return apm_->kNoError;
+}
+
+void* VoiceDetectionImpl::CreateHandle() const {
+  Handle* handle = NULL;
+  if (WebRtcVad_Create(&handle) != apm_->kNoError) {
+    handle = NULL;
+  } else {
+    assert(handle != NULL);
+  }
+
+  return handle;
+}
+
+int VoiceDetectionImpl::DestroyHandle(void* handle) const {
+  return WebRtcVad_Free(static_cast<Handle*>(handle));
+}
+
+int VoiceDetectionImpl::InitializeHandle(void* handle) const {
+  return WebRtcVad_Init(static_cast<Handle*>(handle));
+}
+
+int VoiceDetectionImpl::ConfigureHandle(void* handle) const {
+  return WebRtcVad_set_mode(static_cast<Handle*>(handle),
+                            MapSetting(likelihood_));
+}
+
+int VoiceDetectionImpl::num_handles_required() const {
+  return 1;
+}
+
+int VoiceDetectionImpl::GetHandleError(void* handle) const {
+  // The VAD has no get_error() function.
+  assert(handle != NULL);
+  return apm_->kUnspecifiedError;
+}
+}  // namespace webrtc