modules/audio_processing/agc/agc.cc - src - Git at Google

 /*
  *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "modules/audio_processing/agc/agc.h"

 #include <cmath>
 #include <cstdint>
 #include <cstdlib>
 #include <vector>

 #include "api/array_view.h"
 #include "modules/audio_processing/agc/loudness_histogram.h"
 #include "modules/audio_processing/agc/utility.h"
 #include "rtc_base/checks.h"

 namespace webrtc {
 namespace {

 // Target level, in dBFS, that a newly constructed Agc starts with.
 constexpr int kDefaultLevelDbfs = -18;
 // Passed to LoudnessHistogram::Create() for the main histogram, and the
 // minimum number of histogram updates GetRmsErrorDb() requires before it
 // reports an error value.
 constexpr int kNumAnalysisFrames = 100;
 // GetRmsErrorDb() reports nothing while the histogram's AudioContent() is
 // below kNumAnalysisFrames * kActivityThreshold.
 constexpr double kActivityThreshold = 0.3;
 // Process() multiplies the number of samples it is given by this value to
 // obtain the sample rate, i.e. each call is expected to carry 10 ms of audio.
 constexpr int kNum10msFramesInOneSecond = 100;
 // Upper bound (DCHECK-ed in Process()) on the derived sample rate.
 constexpr int kMaxSampleRateHz = 384000;

 }  // namespace

 // Initializes the target level to kDefaultLevelDbfs (stored both in dBFS and
 // as the value returned by Dbfs2Loudness()) and creates the two histograms:
 // `histogram_` with kNumAnalysisFrames as its Create() argument, and
 // `inactive_histogram_` with the argument-less Create().
 Agc::Agc()
     : target_level_loudness_(Dbfs2Loudness(kDefaultLevelDbfs)),
       target_level_dbfs_(kDefaultLevelDbfs),
       histogram_(LoudnessHistogram::Create(kNumAnalysisFrames)),
       inactive_histogram_(LoudnessHistogram::Create()) {}

 // Defaulted destructor, defined out of line in this file.
 Agc::~Agc() = default;

 // Feeds one frame of audio to `vad_` and adds every per-chunk
 // (RMS, voice probability) pair it produced to `histogram_`.
 //
 // The sample rate is not passed in; it is derived from the number of samples
 // in `audio` (samples * kNum10msFramesInOneSecond) and DCHECK-ed against
 // kMaxSampleRateHz.
 void Agc::Process(ArrayView<const int16_t> audio) {
   const auto num_samples = audio.size();
   const int rate_hz = num_samples * kNum10msFramesInOneSecond;
   RTC_DCHECK_LE(rate_hz, kMaxSampleRateHz);
   vad_.ProcessChunk(audio.data(), num_samples, rate_hz);

   const std::vector<double>& chunk_rms = vad_.chunkwise_rms();
   const std::vector<double>& chunk_probabilities =
       vad_.chunkwise_voice_probabilities();
   RTC_DCHECK_EQ(chunk_rms.size(), chunk_probabilities.size());

   // Walk both vectors in lockstep; they are expected to be the same length.
   auto probability_it = chunk_probabilities.begin();
   for (const double rms_value : chunk_rms) {
     histogram_->Update(rms_value, *probability_it);
     ++probability_it;
   }
 }

 bool Agc::GetRmsErrorDb(int* error) {
   if (!error) {
     RTC_DCHECK_NOTREACHED();
     return false;
   }

   if (histogram_->num_updates() < kNumAnalysisFrames) {
     // We haven't yet received enough frames.
     return false;
   }

   if (histogram_->AudioContent() < kNumAnalysisFrames * kActivityThreshold) {
     // We are likely in an inactive segment.
     return false;
   }

   double loudness = Linear2Loudness(histogram_->CurrentRms());
   *error = std::floor(Loudness2Db(target_level_loudness_ - loudness) + 0.5);
   histogram_->Reset();
   return true;
 }

 // Resets `histogram_`. The target level and `vad_` are left as they are.
 void Agc::Reset() {
   histogram_->Reset();
 }

 // Sets the target level, in dBFS, together with its loudness equivalent.
 //
 // Only levels strictly between -100 and 0 are accepted. Returns 0 on success;
 // returns -1 and keeps the current target when `level` is out of range.
 int Agc::set_target_level_dbfs(int level) {
   // TODO(turajs): just some arbitrary sanity check. We can come up with better
   // limits. The upper limit should be chosen such that the risk of clipping is
   // low. The lower limit should not result in a too quiet signal.
   const bool level_in_range = level > -100 && level < 0;
   if (!level_in_range) {
     return -1;
   }
   target_level_loudness_ = Dbfs2Loudness(level);
   target_level_dbfs_ = level;
   return 0;
 }

 // Returns the current target level in dBFS: kDefaultLevelDbfs after
 // construction, otherwise the last value accepted by set_target_level_dbfs().
 int Agc::target_level_dbfs() const {
   return target_level_dbfs_;
 }

 // Returns `vad_`'s last_voice_probability(), unmodified.
 float Agc::voice_probability() const {
   return vad_.last_voice_probability();
 }

 }  // namespace webrtc
	/*
	* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "modules/audio_processing/agc/agc.h"

	#include <cmath>
	#include <cstdint>
	#include <cstdlib>
	#include <vector>

	#include "api/array_view.h"
	#include "modules/audio_processing/agc/loudness_histogram.h"
	#include "modules/audio_processing/agc/utility.h"
	#include "rtc_base/checks.h"

	namespace webrtc {
	namespace {

	// Target level, in dBFS, that a newly constructed Agc starts with.
	constexpr int kDefaultLevelDbfs = -18;
	// Passed to LoudnessHistogram::Create() for the main histogram, and the
	// minimum number of histogram updates GetRmsErrorDb() requires before it
	// reports an error value.
	constexpr int kNumAnalysisFrames = 100;
	// GetRmsErrorDb() reports nothing while the histogram's AudioContent() is
	// below kNumAnalysisFrames * kActivityThreshold.
	constexpr double kActivityThreshold = 0.3;
	// Process() multiplies the number of samples it is given by this value to
	// obtain the sample rate, i.e. each call is expected to carry 10 ms of audio.
	constexpr int kNum10msFramesInOneSecond = 100;
	// Upper bound (DCHECK-ed in Process()) on the derived sample rate.
	constexpr int kMaxSampleRateHz = 384000;

	} // namespace

	// Initializes the target level to kDefaultLevelDbfs (stored both in dBFS and
	// as the value returned by Dbfs2Loudness()) and creates the two histograms:
	// `histogram_` with kNumAnalysisFrames as its Create() argument, and
	// `inactive_histogram_` with the argument-less Create().
	Agc::Agc()
	: target_level_loudness_(Dbfs2Loudness(kDefaultLevelDbfs)),
	target_level_dbfs_(kDefaultLevelDbfs),
	histogram_(LoudnessHistogram::Create(kNumAnalysisFrames)),
	inactive_histogram_(LoudnessHistogram::Create()) {}

	// Defaulted destructor, defined out of line in this file.
	Agc::~Agc() = default;

	// Feeds one frame of audio to `vad_` and adds every per-chunk
	// (RMS, voice probability) pair it produced to `histogram_`.
	//
	// The sample rate is not passed in; it is derived from the number of samples
	// in `audio` (samples * kNum10msFramesInOneSecond) and DCHECK-ed against
	// kMaxSampleRateHz.
	void Agc::Process(ArrayView<const int16_t> audio) {
	  const auto num_samples = audio.size();
	  const int rate_hz = num_samples * kNum10msFramesInOneSecond;
	  RTC_DCHECK_LE(rate_hz, kMaxSampleRateHz);
	  vad_.ProcessChunk(audio.data(), num_samples, rate_hz);

	  const std::vector<double>& chunk_rms = vad_.chunkwise_rms();
	  const std::vector<double>& chunk_probabilities =
	      vad_.chunkwise_voice_probabilities();
	  RTC_DCHECK_EQ(chunk_rms.size(), chunk_probabilities.size());

	  // Walk both vectors in lockstep; they are expected to be the same length.
	  auto probability_it = chunk_probabilities.begin();
	  for (const double rms_value : chunk_rms) {
	    histogram_->Update(rms_value, *probability_it);
	    ++probability_it;
	  }
	}

	bool Agc::GetRmsErrorDb(int* error) {
	if (!error) {
	RTC_DCHECK_NOTREACHED();
	return false;
	}

	if (histogram_->num_updates() < kNumAnalysisFrames) {
	// We haven't yet received enough frames.
	return false;
	}

	if (histogram_->AudioContent() < kNumAnalysisFrames * kActivityThreshold) {
	// We are likely in an inactive segment.
	return false;
	}

	double loudness = Linear2Loudness(histogram_->CurrentRms());
	*error = std::floor(Loudness2Db(target_level_loudness_ - loudness) + 0.5);
	histogram_->Reset();
	return true;
	}

	// Resets `histogram_`. The target level and `vad_` are left as they are.
	void Agc::Reset() {
	histogram_->Reset();
	}

	// Sets the target level, in dBFS, together with its loudness equivalent.
	//
	// Only levels strictly between -100 and 0 are accepted. Returns 0 on success;
	// returns -1 and keeps the current target when `level` is out of range.
	int Agc::set_target_level_dbfs(int level) {
	  // TODO(turajs): just some arbitrary sanity check. We can come up with better
	  // limits. The upper limit should be chosen such that the risk of clipping is
	  // low. The lower limit should not result in a too quiet signal.
	  if (level >= 0 || level <= -100) {
	    return -1;
	  }
	  target_level_dbfs_ = level;
	  target_level_loudness_ = Dbfs2Loudness(level);
	  return 0;
	}

	// Returns the current target level in dBFS: kDefaultLevelDbfs after
	// construction, otherwise the last value accepted by set_target_level_dbfs().
	int Agc::target_level_dbfs() const {
	return target_level_dbfs_;
	}

	// Returns `vad_`'s last_voice_probability(), unmodified.
	float Agc::voice_probability() const {
	return vad_.last_voice_probability();
	}

	} // namespace webrtc