/* * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #ifndef WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_ #define WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_ #include #include #include #include "webrtc/base/criticalsection.h" #include "webrtc/base/scoped_ptr.h" #include "webrtc/base/thread_annotations.h" #include "webrtc/modules/audio_processing/audio_buffer.h" #include "webrtc/modules/audio_processing/include/audio_processing.h" #include "webrtc/system_wrappers/include/file_wrapper.h" #ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP // Files generated at build-time by the protobuf compiler. #ifdef WEBRTC_ANDROID_PLATFORM_BUILD #include "external/webrtc/webrtc/modules/audio_processing/debug.pb.h" #else #include "webrtc/audio_processing/debug.pb.h" #endif #endif // WEBRTC_AUDIOPROC_DEBUG_DUMP namespace webrtc { class AgcManagerDirect; class AudioConverter; template class Beamformer; class AudioProcessingImpl : public AudioProcessing { public: // Methods forcing APM to run in a single-threaded manner. // Acquires both the render and capture locks. explicit AudioProcessingImpl(const Config& config); // AudioProcessingImpl takes ownership of beamformer. AudioProcessingImpl(const Config& config, Beamformer* beamformer); virtual ~AudioProcessingImpl(); int Initialize() override; int Initialize(int input_sample_rate_hz, int output_sample_rate_hz, int reverse_sample_rate_hz, ChannelLayout input_layout, ChannelLayout output_layout, ChannelLayout reverse_layout) override; int Initialize(const ProcessingConfig& processing_config) override; void SetExtraOptions(const Config& config) override; void UpdateHistogramsOnCallEnd() override; int StartDebugRecording(const char filename[kMaxFilenameSize]) override; int StartDebugRecording(FILE* handle) override; int StartDebugRecordingForPlatformFile(rtc::PlatformFile handle) override; int StopDebugRecording() override; // Capture-side exclusive methods possibly running APM in a // multi-threaded manner. Acquire the capture lock. int ProcessStream(AudioFrame* frame) override; int ProcessStream(const float* const* src, size_t samples_per_channel, int input_sample_rate_hz, ChannelLayout input_layout, int output_sample_rate_hz, ChannelLayout output_layout, float* const* dest) override; int ProcessStream(const float* const* src, const StreamConfig& input_config, const StreamConfig& output_config, float* const* dest) override; void set_output_will_be_muted(bool muted) override; int set_stream_delay_ms(int delay) override; void set_delay_offset_ms(int offset) override; int delay_offset_ms() const override; void set_stream_key_pressed(bool key_pressed) override; int input_sample_rate_hz() const override; // Render-side exclusive methods possibly running APM in a // multi-threaded manner. Acquire the render lock. int AnalyzeReverseStream(AudioFrame* frame) override; int ProcessReverseStream(AudioFrame* frame) override; int AnalyzeReverseStream(const float* const* data, size_t samples_per_channel, int sample_rate_hz, ChannelLayout layout) override; int ProcessReverseStream(const float* const* src, const StreamConfig& reverse_input_config, const StreamConfig& reverse_output_config, float* const* dest) override; // Methods only accessed from APM submodules or // from AudioProcessing tests in a single-threaded manner. // Hence there is no need for locks in these. int proc_sample_rate_hz() const override; int proc_split_sample_rate_hz() const override; size_t num_input_channels() const override; size_t num_proc_channels() const override; size_t num_output_channels() const override; size_t num_reverse_channels() const override; int stream_delay_ms() const override; bool was_stream_delay_set() const override EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); // Methods returning pointers to APM submodules. // No locks are aquired in those, as those locks // would offer no protection (the submodules are // created only once in a single-treaded manner // during APM creation). EchoCancellation* echo_cancellation() const override; EchoControlMobile* echo_control_mobile() const override; GainControl* gain_control() const override; HighPassFilter* high_pass_filter() const override; LevelEstimator* level_estimator() const override; NoiseSuppression* noise_suppression() const override; VoiceDetection* voice_detection() const override; protected: // Overridden in a mock. virtual int InitializeLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); private: struct ApmPublicSubmodules; struct ApmPrivateSubmodules; #ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP // State for the debug dump. struct ApmDebugDumpThreadState { ApmDebugDumpThreadState() : event_msg(new audioproc::Event()) {} rtc::scoped_ptr event_msg; // Protobuf message. std::string event_str; // Memory for protobuf serialization. // Serialized string of last saved APM configuration. std::string last_serialized_config; }; struct ApmDebugDumpState { ApmDebugDumpState() : debug_file(FileWrapper::Create()) {} rtc::scoped_ptr debug_file; ApmDebugDumpThreadState render; ApmDebugDumpThreadState capture; }; #endif // Method for modifying the formats struct that are called from both // the render and capture threads. The check for whether modifications // are needed is done while holding the render lock only, thereby avoiding // that the capture thread blocks the render thread. // The struct is modified in a single-threaded manner by holding both the // render and capture locks. int MaybeInitialize(const ProcessingConfig& config) EXCLUSIVE_LOCKS_REQUIRED(crit_render_); int MaybeInitializeRender(const ProcessingConfig& processing_config) EXCLUSIVE_LOCKS_REQUIRED(crit_render_); int MaybeInitializeCapture(const ProcessingConfig& processing_config) EXCLUSIVE_LOCKS_REQUIRED(crit_render_); // Method for checking for the need of conversion. Accesses the formats // structs in a read manner but the requirement for the render lock to be held // was added as it currently anyway is always called in that manner. bool rev_conversion_needed() const EXCLUSIVE_LOCKS_REQUIRED(crit_render_); bool render_check_rev_conversion_needed() const EXCLUSIVE_LOCKS_REQUIRED(crit_render_); // Methods requiring APM running in a single-threaded manner. // Are called with both the render and capture locks already // acquired. void InitializeExperimentalAgc() EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); void InitializeTransient() EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); void InitializeBeamformer() EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); void InitializeIntelligibility() EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); void InitializeHighPassFilter() EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); void InitializeNoiseSuppression() EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); void InitializeLevelEstimator() EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); void InitializeVoiceDetection() EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); int InitializeLocked(const ProcessingConfig& config) EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); // Capture-side exclusive methods possibly running APM in a multi-threaded // manner that are called with the render lock already acquired. int ProcessStreamLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); bool output_copy_needed(bool is_data_processed) const EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); bool is_data_processed() const EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); bool synthesis_needed(bool is_data_processed) const EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); bool analysis_needed(bool is_data_processed) const EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); void MaybeUpdateHistograms() EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); // Render-side exclusive methods possibly running APM in a multi-threaded // manner that are called with the render lock already acquired. // TODO(ekm): Remove once all clients updated to new interface. int AnalyzeReverseStreamLocked(const float* const* src, const StreamConfig& input_config, const StreamConfig& output_config) EXCLUSIVE_LOCKS_REQUIRED(crit_render_); bool is_rev_processed() const EXCLUSIVE_LOCKS_REQUIRED(crit_render_); int ProcessReverseStreamLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_render_); // Debug dump methods that are internal and called without locks. // TODO(peah): Make thread safe. #ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP // TODO(andrew): make this more graceful. Ideally we would split this stuff // out into a separate class with an "enabled" and "disabled" implementation. static int WriteMessageToDebugFile(FileWrapper* debug_file, rtc::CriticalSection* crit_debug, ApmDebugDumpThreadState* debug_state); int WriteInitMessage() EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); // Writes Config message. If not |forced|, only writes the current config if // it is different from the last saved one; if |forced|, writes the config // regardless of the last saved. int WriteConfigMessage(bool forced) EXCLUSIVE_LOCKS_REQUIRED(crit_capture_) EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); // Critical section. mutable rtc::CriticalSection crit_debug_; // Debug dump state. ApmDebugDumpState debug_dump_; #endif // Critical sections. mutable rtc::CriticalSection crit_render_ ACQUIRED_BEFORE(crit_capture_); mutable rtc::CriticalSection crit_capture_; // Structs containing the pointers to the submodules. rtc::scoped_ptr public_submodules_; rtc::scoped_ptr private_submodules_ GUARDED_BY(crit_capture_); // State that is written to while holding both the render and capture locks // but can be read without any lock being held. // As this is only accessed internally of APM, and all internal methods in APM // either are holding the render or capture locks, this construct is safe as // it is not possible to read the variables while writing them. struct ApmFormatState { ApmFormatState() : // Format of processing streams at input/output call sites. api_format({{{kSampleRate16kHz, 1, false}, {kSampleRate16kHz, 1, false}, {kSampleRate16kHz, 1, false}, {kSampleRate16kHz, 1, false}}}), rev_proc_format(kSampleRate16kHz, 1) {} ProcessingConfig api_format; StreamConfig rev_proc_format; } formats_; // APM constants. const struct ApmConstants { ApmConstants(int agc_startup_min_volume, bool use_new_agc, bool intelligibility_enabled) : // Format of processing streams at input/output call sites. agc_startup_min_volume(agc_startup_min_volume), use_new_agc(use_new_agc), intelligibility_enabled(intelligibility_enabled) {} int agc_startup_min_volume; bool use_new_agc; bool intelligibility_enabled; } constants_; struct ApmCaptureState { ApmCaptureState(bool transient_suppressor_enabled, const std::vector& array_geometry, SphericalPointf target_direction) : aec_system_delay_jumps(-1), delay_offset_ms(0), was_stream_delay_set(false), last_stream_delay_ms(0), last_aec_system_delay_ms(0), stream_delay_jumps(-1), output_will_be_muted(false), key_pressed(false), transient_suppressor_enabled(transient_suppressor_enabled), array_geometry(array_geometry), target_direction(target_direction), fwd_proc_format(kSampleRate16kHz), split_rate(kSampleRate16kHz) {} int aec_system_delay_jumps; int delay_offset_ms; bool was_stream_delay_set; int last_stream_delay_ms; int last_aec_system_delay_ms; int stream_delay_jumps; bool output_will_be_muted; bool key_pressed; bool transient_suppressor_enabled; std::vector array_geometry; SphericalPointf target_direction; rtc::scoped_ptr capture_audio; // Only the rate and samples fields of fwd_proc_format_ are used because the // forward processing number of channels is mutable and is tracked by the // capture_audio_. StreamConfig fwd_proc_format; int split_rate; } capture_ GUARDED_BY(crit_capture_); struct ApmCaptureNonLockedState { ApmCaptureNonLockedState(bool beamformer_enabled) : fwd_proc_format(kSampleRate16kHz), split_rate(kSampleRate16kHz), stream_delay_ms(0), beamformer_enabled(beamformer_enabled) {} // Only the rate and samples fields of fwd_proc_format_ are used because the // forward processing number of channels is mutable and is tracked by the // capture_audio_. StreamConfig fwd_proc_format; int split_rate; int stream_delay_ms; bool beamformer_enabled; } capture_nonlocked_; struct ApmRenderState { rtc::scoped_ptr render_converter; rtc::scoped_ptr render_audio; } render_ GUARDED_BY(crit_render_); }; } // namespace webrtc #endif // WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_