modules/audio_processing/agc2/adaptive_mode_level_estimator.cc - src - Git at Google

 /*
  *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "modules/audio_processing/agc2/adaptive_mode_level_estimator.h"

 #include "modules/audio_processing/agc2/agc2_common.h"
 #include "modules/audio_processing/logging/apm_data_dumper.h"
 #include "rtc_base/checks.h"
 #include "rtc_base/numerics/safe_minmax.h"

 namespace webrtc {

 AdaptiveModeLevelEstimator::AdaptiveModeLevelEstimator(
     ApmDataDumper* apm_data_dumper)
     : level_estimator_(
           AudioProcessing::Config::GainController2::LevelEstimator::kRms),
       use_saturation_protector_(true),
       saturation_protector_(apm_data_dumper),
       apm_data_dumper_(apm_data_dumper) {}

 AdaptiveModeLevelEstimator::AdaptiveModeLevelEstimator(
     ApmDataDumper* apm_data_dumper,
     AudioProcessing::Config::GainController2::LevelEstimator level_estimator,
     bool use_saturation_protector,
     float extra_saturation_margin_db)
     : level_estimator_(level_estimator),
       use_saturation_protector_(use_saturation_protector),
       saturation_protector_(apm_data_dumper, extra_saturation_margin_db),
       apm_data_dumper_(apm_data_dumper) {}

 void AdaptiveModeLevelEstimator::UpdateEstimation(
     const VadWithLevel::LevelAndProbability& vad_data) {
   RTC_DCHECK_GT(vad_data.speech_rms_dbfs, -150.f);
   RTC_DCHECK_LT(vad_data.speech_rms_dbfs, 50.f);
   RTC_DCHECK_GT(vad_data.speech_peak_dbfs, -150.f);
   RTC_DCHECK_LT(vad_data.speech_peak_dbfs, 50.f);
   RTC_DCHECK_GE(vad_data.speech_probability, 0.f);
   RTC_DCHECK_LE(vad_data.speech_probability, 1.f);

   if (vad_data.speech_probability < kVadConfidenceThreshold) {
     DebugDumpEstimate();
     return;
   }

   const bool buffer_is_full = buffer_size_ms_ >= kFullBufferSizeMs;
   if (!buffer_is_full) {
     buffer_size_ms_ += kFrameDurationMs;
   }

   const float leak_factor = buffer_is_full ? kFullBufferLeakFactor : 1.f;

   // Read speech level estimation.
   float speech_level_dbfs = 0.f;
   using LevelEstimatorType =
       AudioProcessing::Config::GainController2::LevelEstimator;
   switch (level_estimator_) {
     case LevelEstimatorType::kRms:
       speech_level_dbfs = vad_data.speech_rms_dbfs;
       break;
     case LevelEstimatorType::kPeak:
       speech_level_dbfs = vad_data.speech_peak_dbfs;
       break;
   }

   // Update speech level estimation.
   estimate_numerator_ = estimate_numerator_ * leak_factor +
                         speech_level_dbfs * vad_data.speech_probability;
   estimate_denominator_ =
       estimate_denominator_ * leak_factor + vad_data.speech_probability;
   last_estimate_with_offset_dbfs_ = estimate_numerator_ / estimate_denominator_;

   if (use_saturation_protector_) {
     saturation_protector_.UpdateMargin(vad_data,
                                        last_estimate_with_offset_dbfs_);
     DebugDumpEstimate();
   }
 }

 float AdaptiveModeLevelEstimator::LatestLevelEstimate() const {
   return rtc::SafeClamp<float>(
       last_estimate_with_offset_dbfs_ +
           (use_saturation_protector_ ? saturation_protector_.LastMargin()
                                      : 0.f),
       -90.f, 30.f);
 }

 void AdaptiveModeLevelEstimator::Reset() {
   buffer_size_ms_ = 0;
   last_estimate_with_offset_dbfs_ = kInitialSpeechLevelEstimateDbfs;
   estimate_numerator_ = 0.f;
   estimate_denominator_ = 0.f;
   saturation_protector_.Reset();
 }

 void AdaptiveModeLevelEstimator::DebugDumpEstimate() {
   apm_data_dumper_->DumpRaw("agc2_adaptive_level_estimate_with_offset_dbfs",
                             last_estimate_with_offset_dbfs_);
   apm_data_dumper_->DumpRaw("agc2_adaptive_level_estimate_dbfs",
                             LatestLevelEstimate());
   saturation_protector_.DebugDumpEstimate();
 }
 }  // namespace webrtc
	/*
	* Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "modules/audio_processing/agc2/adaptive_mode_level_estimator.h"

	#include "modules/audio_processing/agc2/agc2_common.h"
	#include "modules/audio_processing/logging/apm_data_dumper.h"
	#include "rtc_base/checks.h"
	#include "rtc_base/numerics/safe_minmax.h"

	namespace webrtc {

	AdaptiveModeLevelEstimator::AdaptiveModeLevelEstimator(
	ApmDataDumper* apm_data_dumper)
	: level_estimator_(
	AudioProcessing::Config::GainController2::LevelEstimator::kRms),
	use_saturation_protector_(true),
	saturation_protector_(apm_data_dumper),
	apm_data_dumper_(apm_data_dumper) {}

	AdaptiveModeLevelEstimator::AdaptiveModeLevelEstimator(
	ApmDataDumper* apm_data_dumper,
	AudioProcessing::Config::GainController2::LevelEstimator level_estimator,
	bool use_saturation_protector,
	float extra_saturation_margin_db)
	: level_estimator_(level_estimator),
	use_saturation_protector_(use_saturation_protector),
	saturation_protector_(apm_data_dumper, extra_saturation_margin_db),
	apm_data_dumper_(apm_data_dumper) {}

	void AdaptiveModeLevelEstimator::UpdateEstimation(
	const VadWithLevel::LevelAndProbability& vad_data) {
	RTC_DCHECK_GT(vad_data.speech_rms_dbfs, -150.f);
	RTC_DCHECK_LT(vad_data.speech_rms_dbfs, 50.f);
	RTC_DCHECK_GT(vad_data.speech_peak_dbfs, -150.f);
	RTC_DCHECK_LT(vad_data.speech_peak_dbfs, 50.f);
	RTC_DCHECK_GE(vad_data.speech_probability, 0.f);
	RTC_DCHECK_LE(vad_data.speech_probability, 1.f);

	if (vad_data.speech_probability < kVadConfidenceThreshold) {
	DebugDumpEstimate();
	return;
	}

	const bool buffer_is_full = buffer_size_ms_ >= kFullBufferSizeMs;
	if (!buffer_is_full) {
	buffer_size_ms_ += kFrameDurationMs;
	}

	const float leak_factor = buffer_is_full ? kFullBufferLeakFactor : 1.f;

	// Read speech level estimation.
	float speech_level_dbfs = 0.f;
	using LevelEstimatorType =
	AudioProcessing::Config::GainController2::LevelEstimator;
	switch (level_estimator_) {
	case LevelEstimatorType::kRms:
	speech_level_dbfs = vad_data.speech_rms_dbfs;
	break;
	case LevelEstimatorType::kPeak:
	speech_level_dbfs = vad_data.speech_peak_dbfs;
	break;
	}

	// Update speech level estimation.
	estimate_numerator_ = estimate_numerator_ * leak_factor +
	speech_level_dbfs * vad_data.speech_probability;
	estimate_denominator_ =
	estimate_denominator_ * leak_factor + vad_data.speech_probability;
	last_estimate_with_offset_dbfs_ = estimate_numerator_ / estimate_denominator_;

	if (use_saturation_protector_) {
	saturation_protector_.UpdateMargin(vad_data,
	last_estimate_with_offset_dbfs_);
	DebugDumpEstimate();
	}
	}

	float AdaptiveModeLevelEstimator::LatestLevelEstimate() const {
	return rtc::SafeClamp<float>(
	last_estimate_with_offset_dbfs_ +
	(use_saturation_protector_ ? saturation_protector_.LastMargin()
	: 0.f),
	-90.f, 30.f);
	}

	void AdaptiveModeLevelEstimator::Reset() {
	buffer_size_ms_ = 0;
	last_estimate_with_offset_dbfs_ = kInitialSpeechLevelEstimateDbfs;
	estimate_numerator_ = 0.f;
	estimate_denominator_ = 0.f;
	saturation_protector_.Reset();
	}

	void AdaptiveModeLevelEstimator::DebugDumpEstimate() {
	apm_data_dumper_->DumpRaw("agc2_adaptive_level_estimate_with_offset_dbfs",
	last_estimate_with_offset_dbfs_);
	apm_data_dumper_->DumpRaw("agc2_adaptive_level_estimate_dbfs",
	LatestLevelEstimate());
	saturation_protector_.DebugDumpEstimate();
	}
	} // namespace webrtc