/* * Copyright (c) 2018 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include "modules/audio_processing/agc2/adaptive_mode_level_estimator.h" #include "modules/audio_processing/agc2/agc2_common.h" #include "modules/audio_processing/logging/apm_data_dumper.h" #include "rtc_base/checks.h" #include "rtc_base/numerics/safe_minmax.h" namespace webrtc { AdaptiveModeLevelEstimator::AdaptiveModeLevelEstimator( ApmDataDumper* apm_data_dumper) : level_estimator_( AudioProcessing::Config::GainController2::LevelEstimator::kRms), use_saturation_protector_(true), saturation_protector_(apm_data_dumper), apm_data_dumper_(apm_data_dumper) {} AdaptiveModeLevelEstimator::AdaptiveModeLevelEstimator( ApmDataDumper* apm_data_dumper, AudioProcessing::Config::GainController2::LevelEstimator level_estimator, bool use_saturation_protector, float extra_saturation_margin_db) : level_estimator_(level_estimator), use_saturation_protector_(use_saturation_protector), saturation_protector_(apm_data_dumper, extra_saturation_margin_db), apm_data_dumper_(apm_data_dumper) {} void AdaptiveModeLevelEstimator::UpdateEstimation( const VadWithLevel::LevelAndProbability& vad_data) { RTC_DCHECK_GT(vad_data.speech_rms_dbfs, -150.f); RTC_DCHECK_LT(vad_data.speech_rms_dbfs, 50.f); RTC_DCHECK_GT(vad_data.speech_peak_dbfs, -150.f); RTC_DCHECK_LT(vad_data.speech_peak_dbfs, 50.f); RTC_DCHECK_GE(vad_data.speech_probability, 0.f); RTC_DCHECK_LE(vad_data.speech_probability, 1.f); if (vad_data.speech_probability < kVadConfidenceThreshold) { DebugDumpEstimate(); return; } const bool buffer_is_full = buffer_size_ms_ >= kFullBufferSizeMs; if (!buffer_is_full) { buffer_size_ms_ += kFrameDurationMs; } const float leak_factor = buffer_is_full ? kFullBufferLeakFactor : 1.f; // Read speech level estimation. float speech_level_dbfs = 0.f; using LevelEstimatorType = AudioProcessing::Config::GainController2::LevelEstimator; switch (level_estimator_) { case LevelEstimatorType::kRms: speech_level_dbfs = vad_data.speech_rms_dbfs; break; case LevelEstimatorType::kPeak: speech_level_dbfs = vad_data.speech_peak_dbfs; break; } // Update speech level estimation. estimate_numerator_ = estimate_numerator_ * leak_factor + speech_level_dbfs * vad_data.speech_probability; estimate_denominator_ = estimate_denominator_ * leak_factor + vad_data.speech_probability; last_estimate_with_offset_dbfs_ = estimate_numerator_ / estimate_denominator_; if (use_saturation_protector_) { saturation_protector_.UpdateMargin(vad_data, last_estimate_with_offset_dbfs_); DebugDumpEstimate(); } } float AdaptiveModeLevelEstimator::LatestLevelEstimate() const { return rtc::SafeClamp( last_estimate_with_offset_dbfs_ + (use_saturation_protector_ ? saturation_protector_.LastMargin() : 0.f), -90.f, 30.f); } void AdaptiveModeLevelEstimator::Reset() { buffer_size_ms_ = 0; last_estimate_with_offset_dbfs_ = kInitialSpeechLevelEstimateDbfs; estimate_numerator_ = 0.f; estimate_denominator_ = 0.f; saturation_protector_.Reset(); } void AdaptiveModeLevelEstimator::DebugDumpEstimate() { if (apm_data_dumper_) { apm_data_dumper_->DumpRaw("agc2_adaptive_level_estimate_with_offset_dbfs", last_estimate_with_offset_dbfs_); apm_data_dumper_->DumpRaw("agc2_adaptive_level_estimate_dbfs", LatestLevelEstimate()); } saturation_protector_.DebugDumpEstimate(); } } // namespace webrtc