modules/audio_processing/agc2/saturation_protector.cc - src - Git at Google

 /*
  *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "modules/audio_processing/agc2/saturation_protector.h"

 #include "modules/audio_processing/logging/apm_data_dumper.h"
 #include "rtc_base/numerics/safe_compare.h"
 #include "rtc_base/numerics/safe_minmax.h"

 namespace webrtc {
 namespace {

 // Level, in dBFS, that the running peak maximum is (re)set to.
 constexpr float kMinLevelDbfs = -90.0f;

 // Lower and upper bounds for the saturation margin; both are based on the
 // speech crest-factor.
 constexpr float kMinMarginDb = 12.0f;
 constexpr float kMaxMarginDb = 25.0f;

 }  // namespace

 // Empties the ring buffer by zeroing the element count and rewinding the
 // write position. The stored values themselves are not touched.
 void SaturationProtector::RingBuffer::Reset() {
   size_ = 0;
   next_ = 0;
 }

 // Writes `v` at the current write position, then advances that position with
 // wrap-around. The element count grows until it reaches the buffer capacity.
 void SaturationProtector::RingBuffer::PushBack(float v) {
   // Sanity checks on the indices before touching the storage.
   RTC_DCHECK_GE(next_, 0);
   RTC_DCHECK_GE(size_, 0);
   RTC_DCHECK_LT(next_, buffer_.size());
   RTC_DCHECK_LE(size_, buffer_.size());

   buffer_[next_] = v;
   ++next_;
   // Wrap the write position once it runs past the last slot.
   if (rtc::SafeEq(next_, buffer_.size())) {
     next_ = 0;
   }

   // The count saturates at capacity.
   if (rtc::SafeLt(size_, buffer_.size())) {
     ++size_;
   }
 }

 // Returns the value stored at the front of the ring buffer, or
 // `absl::nullopt` when the buffer holds no elements.
 absl::optional<float> SaturationProtector::RingBuffer::Front() const {
   const bool is_empty = (size_ == 0);
   if (is_empty) {
     return absl::nullopt;
   }
   RTC_DCHECK_LT(next_, buffer_.size());
   // When the buffer is full, the front element sits at the write position;
   // otherwise it is the first slot.
   const bool is_full = rtc::SafeEq(size_, buffer_.size());
   if (is_full) {
     return buffer_[next_];
   }
   return buffer_[0];
 }

 // Delegating constructor: uses the value returned by
 // `GetInitialSaturationMarginDb()` as the initial saturation margin.
 SaturationProtector::SaturationProtector(ApmDataDumper* apm_data_dumper)
     : SaturationProtector(
           apm_data_dumper,
           /*initial_saturation_margin_db=*/GetInitialSaturationMarginDb()) {}

 // Stores the data dumper pointer and the initial margin, then brings the
 // remaining state to its starting values through `Reset()`.
 SaturationProtector::SaturationProtector(ApmDataDumper* apm_data_dumper,
                                          float initial_saturation_margin_db)
     : apm_data_dumper_(apm_data_dumper),
       initial_saturation_margin_db_(initial_saturation_margin_db) {
   // `Reset()` reads `initial_saturation_margin_db_`, which is set above.
   Reset();
 }

 // Restores the starting state: empty peak delay buffer, zeroed push timer,
 // running peak maximum at `kMinLevelDbfs` and margin at its initial value.
 void SaturationProtector::Reset() {
   peak_delay_buffer_.Reset();
   time_since_push_ms_ = 0;
   max_peaks_dbfs_ = kMinLevelDbfs;
   margin_db_ = initial_saturation_margin_db_;
 }

 // Updates the saturation margin from a new speech peak and speech level.
 //
 // Each call advances the internal timer by `kFrameDurationMs` and folds
 // `speech_peak_dbfs` into the running maximum. Once the timer exceeds
 // `kPeakEnveloperSuperFrameLengthMs`, that maximum is pushed into the delay
 // buffer and both are reset. The margin is then smoothed towards the
 // difference between the delayed peak and `speech_level_dbfs`, and clamped to
 // [`kMinMarginDb`, `kMaxMarginDb`].
 void SaturationProtector::UpdateMargin(float speech_peak_dbfs,
                                        float speech_level_dbfs) {
   // Track the max peak over `kPeakEnveloperSuperFrameLengthMs` ms.
   max_peaks_dbfs_ = std::max(max_peaks_dbfs_, speech_peak_dbfs);
   time_since_push_ms_ += kFrameDurationMs;

   const bool super_frame_elapsed =
       time_since_push_ms_ > static_cast<int>(kPeakEnveloperSuperFrameLengthMs);
   if (super_frame_elapsed) {
     // Store the super frame maximum and start a new super frame.
     peak_delay_buffer_.PushBack(max_peaks_dbfs_);
     max_peaks_dbfs_ = kMinLevelDbfs;
     time_since_push_ms_ = 0;
   }

   // Compare the estimated speech level with the delayed max speech peak power.
   // TODO(alessiob): Check with aleloi@ why we use a delay and how to tune it.
   const float difference_db = GetDelayedPeakDbfs() - speech_level_dbfs;

   // Use the attack constant when the margin has to grow and the decay
   // constant otherwise.
   const auto smoothing_constant = (margin_db_ < difference_db)
                                       ? kSaturationProtectorAttackConstant
                                       : kSaturationProtectorDecayConstant;
   const float smoothed_margin_db = margin_db_ * smoothing_constant +
                                    difference_db * (1.f - smoothing_constant);

   margin_db_ =
       rtc::SafeClamp<float>(smoothed_margin_db, kMinMarginDb, kMaxMarginDb);
 }

 float SaturationProtector::GetDelayedPeakDbfs() const {
   return peak_delay_buffer_.Front().value_or(max_peaks_dbfs_);
 }

 // Dumps the delayed peak and the current margin through the data dumper.
 // Does nothing when no dumper was provided.
 void SaturationProtector::DebugDumpEstimate() const {
   if (!apm_data_dumper_) {
     return;
   }
   const float delayed_peak_dbfs = GetDelayedPeakDbfs();
   apm_data_dumper_->DumpRaw(
       "agc2_adaptive_saturation_protector_delayed_peak_dbfs",
       delayed_peak_dbfs);
   apm_data_dumper_->DumpRaw("agc2_adaptive_saturation_margin_db", margin_db_);
 }

 }  // namespace webrtc
	/*
	* Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "modules/audio_processing/agc2/saturation_protector.h"

	#include "modules/audio_processing/logging/apm_data_dumper.h"
	#include "rtc_base/numerics/safe_compare.h"
	#include "rtc_base/numerics/safe_minmax.h"

	namespace webrtc {
	namespace {

	// Level, in dBFS, that the running peak maximum is (re)set to.
	constexpr float kMinLevelDbfs = -90.0f;

	// Lower and upper bounds for the saturation margin; both are based on the
	// speech crest-factor.
	constexpr float kMinMarginDb = 12.0f;
	constexpr float kMaxMarginDb = 25.0f;

	} // namespace

	// Empties the ring buffer by zeroing the element count and rewinding the
	// write position. The stored values themselves are not touched.
	void SaturationProtector::RingBuffer::Reset() {
	  size_ = 0;
	  next_ = 0;
	}

	// Writes `v` at the current write position, then advances that position with
	// wrap-around. The element count grows until it reaches the buffer capacity.
	void SaturationProtector::RingBuffer::PushBack(float v) {
	  // Sanity checks on the indices before touching the storage.
	  RTC_DCHECK_GE(next_, 0);
	  RTC_DCHECK_GE(size_, 0);
	  RTC_DCHECK_LT(next_, buffer_.size());
	  RTC_DCHECK_LE(size_, buffer_.size());

	  buffer_[next_] = v;
	  ++next_;
	  // Wrap the write position once it runs past the last slot.
	  if (rtc::SafeEq(next_, buffer_.size())) {
	    next_ = 0;
	  }

	  // The count saturates at capacity.
	  if (rtc::SafeLt(size_, buffer_.size())) {
	    ++size_;
	  }
	}

	// Returns the value stored at the front of the ring buffer, or
	// `absl::nullopt` when the buffer holds no elements.
	absl::optional<float> SaturationProtector::RingBuffer::Front() const {
	  const bool is_empty = (size_ == 0);
	  if (is_empty) {
	    return absl::nullopt;
	  }
	  RTC_DCHECK_LT(next_, buffer_.size());
	  // When the buffer is full, the front element sits at the write position;
	  // otherwise it is the first slot.
	  const bool is_full = rtc::SafeEq(size_, buffer_.size());
	  if (is_full) {
	    return buffer_[next_];
	  }
	  return buffer_[0];
	}

	// Delegating constructor: uses the value returned by
	// `GetInitialSaturationMarginDb()` as the initial saturation margin.
	SaturationProtector::SaturationProtector(ApmDataDumper* apm_data_dumper)
	    : SaturationProtector(
	          apm_data_dumper,
	          /*initial_saturation_margin_db=*/GetInitialSaturationMarginDb()) {}

	// Stores the data dumper pointer and the initial margin, then brings the
	// remaining state to its starting values through `Reset()`.
	SaturationProtector::SaturationProtector(ApmDataDumper* apm_data_dumper,
	                                         float initial_saturation_margin_db)
	    : apm_data_dumper_(apm_data_dumper),
	      initial_saturation_margin_db_(initial_saturation_margin_db) {
	  // `Reset()` reads `initial_saturation_margin_db_`, which is set above.
	  Reset();
	}

	// Restores the starting state: empty peak delay buffer, zeroed push timer,
	// running peak maximum at `kMinLevelDbfs` and margin at its initial value.
	void SaturationProtector::Reset() {
	  peak_delay_buffer_.Reset();
	  time_since_push_ms_ = 0;
	  max_peaks_dbfs_ = kMinLevelDbfs;
	  margin_db_ = initial_saturation_margin_db_;
	}

	// Updates the saturation margin from a new speech peak and speech level.
	//
	// Each call advances the internal timer by `kFrameDurationMs` and folds
	// `speech_peak_dbfs` into the running maximum. Once the timer exceeds
	// `kPeakEnveloperSuperFrameLengthMs`, that maximum is pushed into the delay
	// buffer and both are reset. The margin is then smoothed towards the
	// difference between the delayed peak and `speech_level_dbfs`, and clamped to
	// [`kMinMarginDb`, `kMaxMarginDb`].
	void SaturationProtector::UpdateMargin(float speech_peak_dbfs,
	                                       float speech_level_dbfs) {
	  // Track the max peak over `kPeakEnveloperSuperFrameLengthMs` ms.
	  max_peaks_dbfs_ = std::max(max_peaks_dbfs_, speech_peak_dbfs);
	  time_since_push_ms_ += kFrameDurationMs;

	  const bool super_frame_elapsed =
	      time_since_push_ms_ > static_cast<int>(kPeakEnveloperSuperFrameLengthMs);
	  if (super_frame_elapsed) {
	    // Store the super frame maximum and start a new super frame.
	    peak_delay_buffer_.PushBack(max_peaks_dbfs_);
	    max_peaks_dbfs_ = kMinLevelDbfs;
	    time_since_push_ms_ = 0;
	  }

	  // Compare the estimated speech level with the delayed max speech peak power.
	  // TODO(alessiob): Check with aleloi@ why we use a delay and how to tune it.
	  const float difference_db = GetDelayedPeakDbfs() - speech_level_dbfs;

	  // Use the attack constant when the margin has to grow and the decay
	  // constant otherwise.
	  const auto smoothing_constant = (margin_db_ < difference_db)
	                                      ? kSaturationProtectorAttackConstant
	                                      : kSaturationProtectorDecayConstant;
	  const float smoothed_margin_db = margin_db_ * smoothing_constant +
	                                   difference_db * (1.f - smoothing_constant);

	  margin_db_ =
	      rtc::SafeClamp<float>(smoothed_margin_db, kMinMarginDb, kMaxMarginDb);
	}

	float SaturationProtector::GetDelayedPeakDbfs() const {
	return peak_delay_buffer_.Front().value_or(max_peaks_dbfs_);
	}

	// Dumps the delayed peak and the current margin through the data dumper.
	// Does nothing when no dumper was provided.
	void SaturationProtector::DebugDumpEstimate() const {
	  if (!apm_data_dumper_) {
	    return;
	  }
	  const float delayed_peak_dbfs = GetDelayedPeakDbfs();
	  apm_data_dumper_->DumpRaw(
	      "agc2_adaptive_saturation_protector_delayed_peak_dbfs",
	      delayed_peak_dbfs);
	  apm_data_dumper_->DumpRaw("agc2_adaptive_saturation_margin_db", margin_db_);
	}

	} // namespace webrtc