modules/audio_processing/agc2/adaptive_digital_gain_applier.cc - src - Git at Google

 /*
  *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "modules/audio_processing/agc2/adaptive_digital_gain_applier.h"

 #include <algorithm>

 #include "common_audio/include/audio_util.h"
 #include "modules/audio_processing/agc2/agc2_common.h"
 #include "modules/audio_processing/logging/apm_data_dumper.h"
 #include "rtc_base/checks.h"
 #include "rtc_base/numerics/safe_minmax.h"
 #include "system_wrappers/include/metrics.h"

 namespace webrtc {
 namespace {

 // This function maps input level to desired applied gain. We want to
 // boost the signal so that peaks are at -kHeadroomDbfs. We can't
 // apply more than kMaxGainDb gain.
 float ComputeGainDb(float input_level_dbfs) {
   // If the level is very low, boost it as much as we can.
   if (input_level_dbfs < -(kHeadroomDbfs + kMaxGainDb)) {
     return kMaxGainDb;
   }

   // We expect to end up here most of the time: the level is below
   // -headroom, but we can boost it to -headroom.
   if (input_level_dbfs < -kHeadroomDbfs) {
     return -kHeadroomDbfs - input_level_dbfs;
   }

   // Otherwise, the level is too high and we can't boost. The
   // LevelEstimator is responsible for not reporting bogus gain
   // values.
   RTC_DCHECK_LE(input_level_dbfs, 0.f);
   return 0.f;
 }

 // We require 'gain + noise_level <= kMaxNoiseLevelDbfs'.
 float LimitGainByNoise(float target_gain,
                        float input_noise_level_dbfs,
                        ApmDataDumper* apm_data_dumper) {
   const float noise_headroom_db = kMaxNoiseLevelDbfs - input_noise_level_dbfs;
   apm_data_dumper->DumpRaw("agc2_noise_headroom_db", noise_headroom_db);
   return std::min(target_gain, std::max(noise_headroom_db, 0.f));
 }

 float LimitGainByLowConfidence(float target_gain,
                                float last_gain,
                                float limiter_audio_level_dbfs,
                                bool estimate_is_confident) {
   if (estimate_is_confident ||
       limiter_audio_level_dbfs <= kLimiterThresholdForAgcGainDbfs) {
     return target_gain;
   }
   const float limiter_level_before_gain = limiter_audio_level_dbfs - last_gain;

   // Compute a new gain so that limiter_level_before_gain + new_gain <=
   // kLimiterThreshold.
   const float new_target_gain = std::max(
       kLimiterThresholdForAgcGainDbfs - limiter_level_before_gain, 0.f);
   return std::min(new_target_gain, target_gain);
 }

 // Computes how the gain should change during this frame.
 // Return the gain difference in db to 'last_gain_db'.
 float ComputeGainChangeThisFrameDb(float target_gain_db,
                                    float last_gain_db,
                                    bool gain_increase_allowed) {
   float target_gain_difference_db = target_gain_db - last_gain_db;
   if (!gain_increase_allowed) {
     target_gain_difference_db = std::min(target_gain_difference_db, 0.f);
   }

   return rtc::SafeClamp(target_gain_difference_db, -kMaxGainChangePerFrameDb,
                         kMaxGainChangePerFrameDb);
 }
 }  // namespace

 SignalWithLevels::SignalWithLevels(AudioFrameView<float> float_frame)
     : float_frame(float_frame) {}
 SignalWithLevels::SignalWithLevels(const SignalWithLevels&) = default;

 AdaptiveDigitalGainApplier::AdaptiveDigitalGainApplier(
     ApmDataDumper* apm_data_dumper)
     : gain_applier_(false, DbToRatio(last_gain_db_)),
       apm_data_dumper_(apm_data_dumper) {}

 void AdaptiveDigitalGainApplier::Process(SignalWithLevels signal_with_levels) {
   calls_since_last_gain_log_++;
   if (calls_since_last_gain_log_ == 100) {
     calls_since_last_gain_log_ = 0;
     RTC_HISTOGRAM_COUNTS_LINEAR("WebRTC.Audio.Agc2.DigitalGainApplied",
                                 last_gain_db_, 0, kMaxGainDb, kMaxGainDb + 1);
     RTC_HISTOGRAM_COUNTS_LINEAR("WebRTC.Audio.Agc2.EstimatedNoiseLevel",
                                 -signal_with_levels.input_noise_level_dbfs, 0,
                                 100, 101);
   }

   signal_with_levels.input_level_dbfs =
       std::min(signal_with_levels.input_level_dbfs, 0.f);

   RTC_DCHECK_GE(signal_with_levels.input_level_dbfs, -150.f);
   RTC_DCHECK_GE(signal_with_levels.float_frame.num_channels(), 1);
   RTC_DCHECK_GE(signal_with_levels.float_frame.samples_per_channel(), 1);

   const float target_gain_db = LimitGainByLowConfidence(
       LimitGainByNoise(ComputeGainDb(signal_with_levels.input_level_dbfs),
                        signal_with_levels.input_noise_level_dbfs,
                        apm_data_dumper_),
       last_gain_db_, signal_with_levels.limiter_audio_level_dbfs,
       signal_with_levels.estimate_is_confident);

   // Forbid increasing the gain when there is no speech.
   gain_increase_allowed_ = signal_with_levels.vad_result.speech_probability >
                            kVadConfidenceThreshold;

   const float gain_change_this_frame_db = ComputeGainChangeThisFrameDb(
       target_gain_db, last_gain_db_, gain_increase_allowed_);

   apm_data_dumper_->DumpRaw("agc2_want_to_change_by_db",
                             target_gain_db - last_gain_db_);
   apm_data_dumper_->DumpRaw("agc2_will_change_by_db",
                             gain_change_this_frame_db);

   // Optimization: avoid calling math functions if gain does not
   // change.
   if (gain_change_this_frame_db != 0.f) {
     gain_applier_.SetGainFactor(
         DbToRatio(last_gain_db_ + gain_change_this_frame_db));
   }
   gain_applier_.ApplyGain(signal_with_levels.float_frame);

   // Remember that the gain has changed for the next iteration.
   last_gain_db_ = last_gain_db_ + gain_change_this_frame_db;
   apm_data_dumper_->DumpRaw("agc2_applied_gain_db", last_gain_db_);
 }
 }  // namespace webrtc
	/*
	* Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "modules/audio_processing/agc2/adaptive_digital_gain_applier.h"

	#include <algorithm>

	#include "common_audio/include/audio_util.h"
	#include "modules/audio_processing/agc2/agc2_common.h"
	#include "modules/audio_processing/logging/apm_data_dumper.h"
	#include "rtc_base/checks.h"
	#include "rtc_base/numerics/safe_minmax.h"
	#include "system_wrappers/include/metrics.h"

	namespace webrtc {
	namespace {

	// This function maps input level to desired applied gain. We want to
	// boost the signal so that peaks are at -kHeadroomDbfs. We can't
	// apply more than kMaxGainDb gain.
	float ComputeGainDb(float input_level_dbfs) {
	// If the level is very low, boost it as much as we can.
	if (input_level_dbfs < -(kHeadroomDbfs + kMaxGainDb)) {
	return kMaxGainDb;
	}

	// We expect to end up here most of the time: the level is below
	// -headroom, but we can boost it to -headroom.
	if (input_level_dbfs < -kHeadroomDbfs) {
	return -kHeadroomDbfs - input_level_dbfs;
	}

	// Otherwise, the level is too high and we can't boost. The
	// LevelEstimator is responsible for not reporting bogus gain
	// values.
	RTC_DCHECK_LE(input_level_dbfs, 0.f);
	return 0.f;
	}

	// We require 'gain + noise_level <= kMaxNoiseLevelDbfs'.
	float LimitGainByNoise(float target_gain,
	float input_noise_level_dbfs,
	ApmDataDumper* apm_data_dumper) {
	const float noise_headroom_db = kMaxNoiseLevelDbfs - input_noise_level_dbfs;
	apm_data_dumper->DumpRaw("agc2_noise_headroom_db", noise_headroom_db);
	return std::min(target_gain, std::max(noise_headroom_db, 0.f));
	}

	float LimitGainByLowConfidence(float target_gain,
	float last_gain,
	float limiter_audio_level_dbfs,
	bool estimate_is_confident) {
	if (estimate_is_confident \|\|
	limiter_audio_level_dbfs <= kLimiterThresholdForAgcGainDbfs) {
	return target_gain;
	}
	const float limiter_level_before_gain = limiter_audio_level_dbfs - last_gain;

	// Compute a new gain so that limiter_level_before_gain + new_gain <=
	// kLimiterThreshold.
	const float new_target_gain = std::max(
	kLimiterThresholdForAgcGainDbfs - limiter_level_before_gain, 0.f);
	return std::min(new_target_gain, target_gain);
	}

	// Computes how the gain should change during this frame.
	// Return the gain difference in db to 'last_gain_db'.
	float ComputeGainChangeThisFrameDb(float target_gain_db,
	float last_gain_db,
	bool gain_increase_allowed) {
	float target_gain_difference_db = target_gain_db - last_gain_db;
	if (!gain_increase_allowed) {
	target_gain_difference_db = std::min(target_gain_difference_db, 0.f);
	}

	return rtc::SafeClamp(target_gain_difference_db, -kMaxGainChangePerFrameDb,
	kMaxGainChangePerFrameDb);
	}
	} // namespace

	SignalWithLevels::SignalWithLevels(AudioFrameView<float> float_frame)
	: float_frame(float_frame) {}
	SignalWithLevels::SignalWithLevels(const SignalWithLevels&) = default;

	AdaptiveDigitalGainApplier::AdaptiveDigitalGainApplier(
	ApmDataDumper* apm_data_dumper)
	: gain_applier_(false, DbToRatio(last_gain_db_)),
	apm_data_dumper_(apm_data_dumper) {}

	void AdaptiveDigitalGainApplier::Process(SignalWithLevels signal_with_levels) {
	calls_since_last_gain_log_++;
	if (calls_since_last_gain_log_ == 100) {
	calls_since_last_gain_log_ = 0;
	RTC_HISTOGRAM_COUNTS_LINEAR("WebRTC.Audio.Agc2.DigitalGainApplied",
	last_gain_db_, 0, kMaxGainDb, kMaxGainDb + 1);
	RTC_HISTOGRAM_COUNTS_LINEAR("WebRTC.Audio.Agc2.EstimatedNoiseLevel",
	-signal_with_levels.input_noise_level_dbfs, 0,
	100, 101);
	}

	signal_with_levels.input_level_dbfs =
	std::min(signal_with_levels.input_level_dbfs, 0.f);

	RTC_DCHECK_GE(signal_with_levels.input_level_dbfs, -150.f);
	RTC_DCHECK_GE(signal_with_levels.float_frame.num_channels(), 1);
	RTC_DCHECK_GE(signal_with_levels.float_frame.samples_per_channel(), 1);

	const float target_gain_db = LimitGainByLowConfidence(
	LimitGainByNoise(ComputeGainDb(signal_with_levels.input_level_dbfs),
	signal_with_levels.input_noise_level_dbfs,
	apm_data_dumper_),
	last_gain_db_, signal_with_levels.limiter_audio_level_dbfs,
	signal_with_levels.estimate_is_confident);

	// Forbid increasing the gain when there is no speech.
	gain_increase_allowed_ = signal_with_levels.vad_result.speech_probability >
	kVadConfidenceThreshold;

	const float gain_change_this_frame_db = ComputeGainChangeThisFrameDb(
	target_gain_db, last_gain_db_, gain_increase_allowed_);

	apm_data_dumper_->DumpRaw("agc2_want_to_change_by_db",
	target_gain_db - last_gain_db_);
	apm_data_dumper_->DumpRaw("agc2_will_change_by_db",
	gain_change_this_frame_db);

	// Optimization: avoid calling math functions if gain does not
	// change.
	if (gain_change_this_frame_db != 0.f) {
	gain_applier_.SetGainFactor(
	DbToRatio(last_gain_db_ + gain_change_this_frame_db));
	}
	gain_applier_.ApplyGain(signal_with_levels.float_frame);

	// Remember that the gain has changed for the next iteration.
	last_gain_db_ = last_gain_db_ + gain_change_this_frame_db;
	apm_data_dumper_->DumpRaw("agc2_applied_gain_db", last_gain_db_);
	}
	} // namespace webrtc