Index: webrtc/modules/audio_processing/level_controller/level_controller.cc |
diff --git a/webrtc/modules/audio_processing/level_controller/level_controller.cc b/webrtc/modules/audio_processing/level_controller/level_controller.cc |
new file mode 100644 |
index 0000000000000000000000000000000000000000..fa26c059cbbb333c7fbe481b59ffb49495990bc3 |
--- /dev/null |
+++ b/webrtc/modules/audio_processing/level_controller/level_controller.cc |
@@ -0,0 +1,147 @@ |
+/* |
+ * Copyright (c) 2016 The WebRTC project authors. All Rights Reserved. |
+ * |
+ * Use of this source code is governed by a BSD-style license |
+ * that can be found in the LICENSE file in the root of the source |
+ * tree. An additional intellectual property rights grant can be found |
+ * in the file PATENTS. All contributing project authors may |
+ * be found in the AUTHORS file in the root of the source tree. |
+ */ |
+ |
+#include "webrtc/modules/audio_processing/level_controller/level_controller.h" |
+ |
+#include <algorithm> |
+#include <cmath> |
+#include <numeric> |
+ |
+#include "webrtc/base/array_view.h" |
+#include "webrtc/base/checks.h" |
+#include "webrtc/modules/audio_processing/audio_buffer.h" |
+#include "webrtc/modules/audio_processing/level_controller/gain_applier.h" |
+#include "webrtc/modules/audio_processing/level_controller/gain_selector.h" |
+#include "webrtc/modules/audio_processing/level_controller/noise_level_estimator.h" |
+#include "webrtc/modules/audio_processing/level_controller/peak_level_estimator.h" |
+#include "webrtc/modules/audio_processing/level_controller/saturating_gain_estimator.h" |
+#include "webrtc/modules/audio_processing/level_controller/signal_classifier.h" |
+#include "webrtc/modules/audio_processing/logging/apm_data_dumper.h" |
+ |
+namespace webrtc { |
+namespace { |
+ |
+// Updates the running DC estimate stored in dc_level with the mean of x and |
+// then subtracts the updated estimate from every sample of x, in place. |
+// |
+// forgetting_factor is the weight given to the mean of the current frame when |
+// it is blended into the running estimate. x must not be empty. |
+void UpdateAndRemoveDcLevel(float forgetting_factor, |
+                            float* dc_level, |
+                            rtc::ArrayView<float> x) { |
+  RTC_DCHECK(!x.empty()); |
+  // The initial value has to be a float: std::accumulate keeps its running sum |
+  // in the type of that argument, so an int literal would truncate the sum |
+  // after every sample and yield a wrong mean. |
+  float mean = |
+      std::accumulate(x.begin(), x.end(), 0.f) / static_cast<float>(x.size()); |
+  *dc_level += forgetting_factor * (mean - *dc_level); |
+ |
+  for (float& v : x) { |
+    v -= *dc_level; |
+  } |
+} |
+ |
+// Returns the energy (sum of squared samples) of the channel in audio that has |
+// the highest energy, or 0 when there are no channels. |
+float FrameEnergy(const AudioBuffer& audio) { |
+  float energy = 0.f; |
+  for (size_t k = 0; k < audio.num_channels(); ++k) { |
+    // The initial value has to be a float: std::accumulate stores the running |
+    // sum in the type of that argument, so an int literal would convert the |
+    // float result of the lambda back to int after every sample, truncating it |
+    // and overflowing int for large sample values. |
+    float channel_energy = |
+        std::accumulate(audio.channels_const_f()[k], |
+                        audio.channels_const_f()[k] + audio.num_frames(), 0.f, |
+                        [](float a, float b) -> float { return a + b * b; }); |
+    energy = std::max(channel_energy, energy); |
+  } |
+  return energy; |
+} |
+ |
+// Returns the largest absolute sample value found in any channel of audio, or |
+// 0 when the buffer holds no samples. |
+float PeakLevel(const AudioBuffer& audio) { |
+  float peak_level = 0.f; |
+  for (size_t k = 0; k < audio.num_channels(); ++k) { |
+    const float* const channel = audio.channels_const_f()[k]; |
+    // Compare magnitudes rather than signed values so that a peak on the |
+    // negative side of the waveform is counted as well. A plain loop also |
+    // avoids dereferencing the end pointer when the frame is empty. |
+    for (size_t j = 0; j < audio.num_frames(); ++j) { |
+      peak_level = std::max(peak_level, std::abs(channel[j])); |
+    } |
+  } |
+  return peak_level; |
+} |
+ |
+} // namespace |
+ |
+// Number of LevelController objects constructed so far. The value at |
+// construction time is handed to the data dumper of the new instance. |
+int LevelController::instance_count_ = 0; |
+ |
+// Creates the data dumper, wires it into the gain applier and the signal |
+// classifier, and initializes the controller for a 48 kHz sample rate. |
+LevelController::LevelController() |
+    : data_dumper_(new ApmDataDumper(instance_count_)), |
+      gain_applier_(data_dumper_.get()), |
+      signal_classifier_(data_dumper_.get()) { |
+  // The dumper above already received the pre-increment count. |
+  ++instance_count_; |
+  Initialize(AudioProcessing::kSampleRate48kHz); |
+} |
+ |
+// Nothing to release by hand; the members clean up after themselves. |
+LevelController::~LevelController() = default; |
+ |
+// (Re)initializes the controller and its sub-components for sample_rate_hz, |
+// which must equal one of the AudioProcessing::kSampleRate{8,16,32,48}kHz |
+// constants, and starts a new set of data dumper recordings. |
+// NOTE(review): dc_level_ is not touched here, so the DC estimates carry over |
+// across calls - confirm that this is intended. |
+void LevelController::Initialize(int sample_rate_hz) { |
+  RTC_DCHECK(sample_rate_hz == AudioProcessing::kSampleRate8kHz || |
+             sample_rate_hz == AudioProcessing::kSampleRate16kHz || |
+             sample_rate_hz == AudioProcessing::kSampleRate32kHz || |
+             sample_rate_hz == AudioProcessing::kSampleRate48kHz); |
+ |
+  // Rate-dependent state owned by the controller itself. The DC forgetting |
+  // factor is 0.01 at 48000 Hz and scales linearly with the sample rate. |
+  sample_rate_hz_ = rtc::Optional<int>(sample_rate_hz); |
+  dc_forgetting_factor_ = 0.01f * sample_rate_hz / 48000.f; |
+ |
+  // Start a fresh set of recordings before resetting the sub-components. |
+  data_dumper_->InitiateNewSetOfRecordings(); |
+ |
+  // Sub-components that take the sample rate. |
+  gain_selector_.Initialize(sample_rate_hz); |
+  gain_applier_.Initialize(sample_rate_hz); |
+  signal_classifier_.Initialize(sample_rate_hz); |
+  noise_level_estimator_.Initialize(sample_rate_hz); |
+ |
+  // Sub-components that are initialized without a sample rate. |
+  peak_level_estimator_.Initialize(); |
+  saturating_gain_estimator_.Initialize(); |
+} |
+ |
+// Runs one frame of level control on audio, in place: removes the DC level of |
+// each channel, classifies the frame, updates the noise and peak estimates, |
+// selects and applies a gain, and feeds the resulting saturation count back |
+// into the saturating gain estimate. Intermediate values are handed to the |
+// data dumper along the way. |
+void LevelController::Process(AudioBuffer* audio) { |
+  // Preconditions: one or two channels, and the sample rate and DC forgetting |
+  // factor must have been set (Initialize() does both). |
+  RTC_DCHECK_LT(0u, audio->num_channels()); |
+  RTC_DCHECK_GE(2u, audio->num_channels()); |
+  RTC_DCHECK_NE(0.f, dc_forgetting_factor_); |
+  RTC_DCHECK(sample_rate_hz_); |
+ |
+  // Only the first channel of the input is recorded. |
+  data_dumper_->DumpWav("lc_input", audio->num_frames(), |
+                        audio->channels_const_f()[0], *sample_rate_hz_, 1); |
+ |
+  // Track and subtract the DC level of every channel separately. |
+  for (size_t ch = 0; ch < audio->num_channels(); ++ch) { |
+    rtc::ArrayView<float> samples(audio->channels_f()[ch], |
+                                  audio->num_frames()); |
+    UpdateAndRemoveDcLevel(dc_forgetting_factor_, &dc_level_[ch], samples); |
+  } |
+ |
+  // Classify the frame; the result steers the estimators and gain selection. |
+  SignalClassifier::SignalType signal_type; |
+  signal_classifier_.Analyze(*audio, &signal_type); |
+  int signal_type_value = static_cast<int>(signal_type); |
+  data_dumper_->DumpRaw("lc_signal_type", 1, &signal_type_value); |
+ |
+  // Update the noise energy estimate with the energy of this frame. |
+  const float frame_energy = FrameEnergy(*audio); |
+  float noise_energy = noise_level_estimator_.Analyze(signal_type, frame_energy); |
+ |
+  // Update the overall peak level estimate with the peak of this frame. |
+  const float frame_peak = PeakLevel(*audio); |
+  float peak_level = peak_level_estimator_.Analyze(signal_type, frame_peak); |
+ |
+  // Saturating gain as estimated up to, but not including, this frame. |
+  float saturating_gain = saturating_gain_estimator_.GetGain(); |
+ |
+  // Choose the gain for this frame and apply it to the signal. |
+  float new_gain = gain_selector_.GetNewGain(peak_level, noise_energy, |
+                                             saturating_gain, signal_type); |
+  int num_saturations = gain_applier_.Process(new_gain, audio); |
+ |
+  // Refine the saturating gain estimate from the saturations just observed. |
+  saturating_gain_estimator_.Update(new_gain, num_saturations); |
+ |
+  data_dumper_->DumpRaw("lc_selected_gain", 1, &new_gain); |
+  data_dumper_->DumpRaw("lc_noise_energy", 1, &noise_energy); |
+  data_dumper_->DumpRaw("lc_peak_level", 1, &peak_level); |
+  data_dumper_->DumpRaw("lc_saturating_gain", 1, &saturating_gain); |
+ |
+  // Only the first channel of the output is recorded. |
+  data_dumper_->DumpWav("lc_output", audio->num_frames(), |
+                        audio->channels_f()[0], *sample_rate_hz_, 1); |
+} |
+ |
+} // namespace webrtc |