1 /* 2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. 3 * 4 * Use of this source code is governed by a BSD-style license 5 * that can be found in the LICENSE file in the root of the source 6 * tree. An additional intellectual property rights grant can be found 7 * in the file PATENTS. All contributing project authors may 8 * be found in the AUTHORS file in the root of the source tree. 9 */ 10 11 #ifndef WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_ 12 #define WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_ 13 14 #include <list> 15 #include <string> 16 #include <vector> 17 18 #include "webrtc/base/criticalsection.h" 19 #include "webrtc/base/scoped_ptr.h" 20 #include "webrtc/base/thread_annotations.h" 21 #include "webrtc/modules/audio_processing/audio_buffer.h" 22 #include "webrtc/modules/audio_processing/include/audio_processing.h" 23 #include "webrtc/system_wrappers/include/file_wrapper.h" 24 25 #ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP 26 // Files generated at build-time by the protobuf compiler. 27 #ifdef WEBRTC_ANDROID_PLATFORM_BUILD 28 #include "external/webrtc/webrtc/modules/audio_processing/debug.pb.h" 29 #else 30 #include "webrtc/audio_processing/debug.pb.h" 31 #endif 32 #endif // WEBRTC_AUDIOPROC_DEBUG_DUMP 33 34 namespace webrtc { 35 36 class AgcManagerDirect; 37 class AudioConverter; 38 39 template<typename T> 40 class Beamformer; 41 42 class AudioProcessingImpl : public AudioProcessing { 43 public: 44 // Methods forcing APM to run in a single-threaded manner. 45 // Acquires both the render and capture locks. 46 explicit AudioProcessingImpl(const Config& config); 47 // AudioProcessingImpl takes ownership of beamformer. 48 AudioProcessingImpl(const Config& config, Beamformer<float>* beamformer); 49 virtual ~AudioProcessingImpl(); 50 int Initialize() override; 51 int Initialize(int input_sample_rate_hz, 52 int output_sample_rate_hz, 53 int reverse_sample_rate_hz, 54 ChannelLayout input_layout, 55 ChannelLayout output_layout, 56 ChannelLayout reverse_layout) override; 57 int Initialize(const ProcessingConfig& processing_config) override; 58 void SetExtraOptions(const Config& config) override; 59 void UpdateHistogramsOnCallEnd() override; 60 int StartDebugRecording(const char filename[kMaxFilenameSize]) override; 61 int StartDebugRecording(FILE* handle) override; 62 int StartDebugRecordingForPlatformFile(rtc::PlatformFile handle) override; 63 int StopDebugRecording() override; 64 65 // Capture-side exclusive methods possibly running APM in a 66 // multi-threaded manner. Acquire the capture lock. 67 int ProcessStream(AudioFrame* frame) override; 68 int ProcessStream(const float* const* src, 69 size_t samples_per_channel, 70 int input_sample_rate_hz, 71 ChannelLayout input_layout, 72 int output_sample_rate_hz, 73 ChannelLayout output_layout, 74 float* const* dest) override; 75 int ProcessStream(const float* const* src, 76 const StreamConfig& input_config, 77 const StreamConfig& output_config, 78 float* const* dest) override; 79 void set_output_will_be_muted(bool muted) override; 80 int set_stream_delay_ms(int delay) override; 81 void set_delay_offset_ms(int offset) override; 82 int delay_offset_ms() const override; 83 void set_stream_key_pressed(bool key_pressed) override; 84 int input_sample_rate_hz() const override; 85 86 // Render-side exclusive methods possibly running APM in a 87 // multi-threaded manner. Acquire the render lock. 88 int AnalyzeReverseStream(AudioFrame* frame) override; 89 int ProcessReverseStream(AudioFrame* frame) override; 90 int AnalyzeReverseStream(const float* const* data, 91 size_t samples_per_channel, 92 int sample_rate_hz, 93 ChannelLayout layout) override; 94 int ProcessReverseStream(const float* const* src, 95 const StreamConfig& reverse_input_config, 96 const StreamConfig& reverse_output_config, 97 float* const* dest) override; 98 99 // Methods only accessed from APM submodules or 100 // from AudioProcessing tests in a single-threaded manner. 101 // Hence there is no need for locks in these. 102 int proc_sample_rate_hz() const override; 103 int proc_split_sample_rate_hz() const override; 104 size_t num_input_channels() const override; 105 size_t num_proc_channels() const override; 106 size_t num_output_channels() const override; 107 size_t num_reverse_channels() const override; 108 int stream_delay_ms() const override; 109 bool was_stream_delay_set() const override 110 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 111 112 // Methods returning pointers to APM submodules. 113 // No locks are aquired in those, as those locks 114 // would offer no protection (the submodules are 115 // created only once in a single-treaded manner 116 // during APM creation). 117 EchoCancellation* echo_cancellation() const override; 118 EchoControlMobile* echo_control_mobile() const override; 119 GainControl* gain_control() const override; 120 HighPassFilter* high_pass_filter() const override; 121 LevelEstimator* level_estimator() const override; 122 NoiseSuppression* noise_suppression() const override; 123 VoiceDetection* voice_detection() const override; 124 125 protected: 126 // Overridden in a mock. 127 virtual int InitializeLocked() 128 EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); 129 130 private: 131 struct ApmPublicSubmodules; 132 struct ApmPrivateSubmodules; 133 134 #ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP 135 // State for the debug dump. 136 struct ApmDebugDumpThreadState { 137 ApmDebugDumpThreadState() : event_msg(new audioproc::Event()) {} 138 rtc::scoped_ptr<audioproc::Event> event_msg; // Protobuf message. 139 std::string event_str; // Memory for protobuf serialization. 140 141 // Serialized string of last saved APM configuration. 142 std::string last_serialized_config; 143 }; 144 145 struct ApmDebugDumpState { 146 ApmDebugDumpState() : debug_file(FileWrapper::Create()) {} 147 rtc::scoped_ptr<FileWrapper> debug_file; 148 ApmDebugDumpThreadState render; 149 ApmDebugDumpThreadState capture; 150 }; 151 #endif 152 153 // Method for modifying the formats struct that are called from both 154 // the render and capture threads. The check for whether modifications 155 // are needed is done while holding the render lock only, thereby avoiding 156 // that the capture thread blocks the render thread. 157 // The struct is modified in a single-threaded manner by holding both the 158 // render and capture locks. 159 int MaybeInitialize(const ProcessingConfig& config) 160 EXCLUSIVE_LOCKS_REQUIRED(crit_render_); 161 162 int MaybeInitializeRender(const ProcessingConfig& processing_config) 163 EXCLUSIVE_LOCKS_REQUIRED(crit_render_); 164 165 int MaybeInitializeCapture(const ProcessingConfig& processing_config) 166 EXCLUSIVE_LOCKS_REQUIRED(crit_render_); 167 168 // Method for checking for the need of conversion. Accesses the formats 169 // structs in a read manner but the requirement for the render lock to be held 170 // was added as it currently anyway is always called in that manner. 171 bool rev_conversion_needed() const EXCLUSIVE_LOCKS_REQUIRED(crit_render_); 172 bool render_check_rev_conversion_needed() const 173 EXCLUSIVE_LOCKS_REQUIRED(crit_render_); 174 175 // Methods requiring APM running in a single-threaded manner. 176 // Are called with both the render and capture locks already 177 // acquired. 178 void InitializeExperimentalAgc() 179 EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); 180 void InitializeTransient() 181 EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); 182 void InitializeBeamformer() 183 EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); 184 void InitializeIntelligibility() 185 EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); 186 void InitializeHighPassFilter() 187 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 188 void InitializeNoiseSuppression() 189 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 190 void InitializeLevelEstimator() 191 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 192 void InitializeVoiceDetection() 193 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 194 int InitializeLocked(const ProcessingConfig& config) 195 EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); 196 197 // Capture-side exclusive methods possibly running APM in a multi-threaded 198 // manner that are called with the render lock already acquired. 199 int ProcessStreamLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 200 bool output_copy_needed(bool is_data_processed) const 201 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 202 bool is_data_processed() const EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 203 bool synthesis_needed(bool is_data_processed) const 204 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 205 bool analysis_needed(bool is_data_processed) const 206 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 207 void MaybeUpdateHistograms() EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 208 209 // Render-side exclusive methods possibly running APM in a multi-threaded 210 // manner that are called with the render lock already acquired. 211 // TODO(ekm): Remove once all clients updated to new interface. 212 int AnalyzeReverseStreamLocked(const float* const* src, 213 const StreamConfig& input_config, 214 const StreamConfig& output_config) 215 EXCLUSIVE_LOCKS_REQUIRED(crit_render_); 216 bool is_rev_processed() const EXCLUSIVE_LOCKS_REQUIRED(crit_render_); 217 int ProcessReverseStreamLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_render_); 218 219 // Debug dump methods that are internal and called without locks. 220 // TODO(peah): Make thread safe. 221 #ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP 222 // TODO(andrew): make this more graceful. Ideally we would split this stuff 223 // out into a separate class with an "enabled" and "disabled" implementation. 224 static int WriteMessageToDebugFile(FileWrapper* debug_file, 225 rtc::CriticalSection* crit_debug, 226 ApmDebugDumpThreadState* debug_state); 227 int WriteInitMessage() EXCLUSIVE_LOCKS_REQUIRED(crit_render_, crit_capture_); 228 229 // Writes Config message. If not |forced|, only writes the current config if 230 // it is different from the last saved one; if |forced|, writes the config 231 // regardless of the last saved. 232 int WriteConfigMessage(bool forced) EXCLUSIVE_LOCKS_REQUIRED(crit_capture_) 233 EXCLUSIVE_LOCKS_REQUIRED(crit_capture_); 234 235 // Critical section. 236 mutable rtc::CriticalSection crit_debug_; 237 238 // Debug dump state. 239 ApmDebugDumpState debug_dump_; 240 #endif 241 242 // Critical sections. 243 mutable rtc::CriticalSection crit_render_ ACQUIRED_BEFORE(crit_capture_); 244 mutable rtc::CriticalSection crit_capture_; 245 246 // Structs containing the pointers to the submodules. 247 rtc::scoped_ptr<ApmPublicSubmodules> public_submodules_; 248 rtc::scoped_ptr<ApmPrivateSubmodules> private_submodules_ 249 GUARDED_BY(crit_capture_); 250 251 // State that is written to while holding both the render and capture locks 252 // but can be read without any lock being held. 253 // As this is only accessed internally of APM, and all internal methods in APM 254 // either are holding the render or capture locks, this construct is safe as 255 // it is not possible to read the variables while writing them. 256 struct ApmFormatState { 257 ApmFormatState() 258 : // Format of processing streams at input/output call sites. 259 api_format({{{kSampleRate16kHz, 1, false}, 260 {kSampleRate16kHz, 1, false}, 261 {kSampleRate16kHz, 1, false}, 262 {kSampleRate16kHz, 1, false}}}), 263 rev_proc_format(kSampleRate16kHz, 1) {} 264 ProcessingConfig api_format; 265 StreamConfig rev_proc_format; 266 } formats_; 267 268 // APM constants. 269 const struct ApmConstants { 270 ApmConstants(int agc_startup_min_volume, 271 bool use_new_agc, 272 bool intelligibility_enabled) 273 : // Format of processing streams at input/output call sites. 274 agc_startup_min_volume(agc_startup_min_volume), 275 use_new_agc(use_new_agc), 276 intelligibility_enabled(intelligibility_enabled) {} 277 int agc_startup_min_volume; 278 bool use_new_agc; 279 bool intelligibility_enabled; 280 } constants_; 281 282 struct ApmCaptureState { 283 ApmCaptureState(bool transient_suppressor_enabled, 284 const std::vector<Point>& array_geometry, 285 SphericalPointf target_direction) 286 : aec_system_delay_jumps(-1), 287 delay_offset_ms(0), 288 was_stream_delay_set(false), 289 last_stream_delay_ms(0), 290 last_aec_system_delay_ms(0), 291 stream_delay_jumps(-1), 292 output_will_be_muted(false), 293 key_pressed(false), 294 transient_suppressor_enabled(transient_suppressor_enabled), 295 array_geometry(array_geometry), 296 target_direction(target_direction), 297 fwd_proc_format(kSampleRate16kHz), 298 split_rate(kSampleRate16kHz) {} 299 int aec_system_delay_jumps; 300 int delay_offset_ms; 301 bool was_stream_delay_set; 302 int last_stream_delay_ms; 303 int last_aec_system_delay_ms; 304 int stream_delay_jumps; 305 bool output_will_be_muted; 306 bool key_pressed; 307 bool transient_suppressor_enabled; 308 std::vector<Point> array_geometry; 309 SphericalPointf target_direction; 310 rtc::scoped_ptr<AudioBuffer> capture_audio; 311 // Only the rate and samples fields of fwd_proc_format_ are used because the 312 // forward processing number of channels is mutable and is tracked by the 313 // capture_audio_. 314 StreamConfig fwd_proc_format; 315 int split_rate; 316 } capture_ GUARDED_BY(crit_capture_); 317 318 struct ApmCaptureNonLockedState { 319 ApmCaptureNonLockedState(bool beamformer_enabled) 320 : fwd_proc_format(kSampleRate16kHz), 321 split_rate(kSampleRate16kHz), 322 stream_delay_ms(0), 323 beamformer_enabled(beamformer_enabled) {} 324 // Only the rate and samples fields of fwd_proc_format_ are used because the 325 // forward processing number of channels is mutable and is tracked by the 326 // capture_audio_. 327 StreamConfig fwd_proc_format; 328 int split_rate; 329 int stream_delay_ms; 330 bool beamformer_enabled; 331 } capture_nonlocked_; 332 333 struct ApmRenderState { 334 rtc::scoped_ptr<AudioConverter> render_converter; 335 rtc::scoped_ptr<AudioBuffer> render_audio; 336 } render_ GUARDED_BY(crit_render_); 337 }; 338 339 } // namespace webrtc 340 341 #endif // WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_ 342