|  | /* | 
|  | *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. | 
|  | * | 
|  | *  Use of this source code is governed by a BSD-style license | 
|  | *  that can be found in the LICENSE file in the root of the source | 
|  | *  tree. An additional intellectual property rights grant can be found | 
|  | *  in the file PATENTS.  All contributing project authors may | 
|  | *  be found in the AUTHORS file in the root of the source tree. | 
|  | */ | 
|  |  | 
|  | #include "modules/audio_processing/agc/agc.h" | 
|  |  | 
|  | #include <cmath> | 
|  | #include <cstdint> | 
|  | #include <cstdlib> | 
|  | #include <vector> | 
|  |  | 
|  | #include "api/array_view.h" | 
|  | #include "modules/audio_processing/agc/loudness_histogram.h" | 
|  | #include "modules/audio_processing/agc/utility.h" | 
|  | #include "rtc_base/checks.h" | 
|  |  | 
|  | namespace webrtc { | 
|  | namespace { | 
|  |  | 
|  | constexpr int kDefaultLevelDbfs = -18; | 
|  | constexpr int kNumAnalysisFrames = 100; | 
|  | constexpr double kActivityThreshold = 0.3; | 
|  | constexpr int kNum10msFramesInOneSecond = 100; | 
|  | constexpr int kMaxSampleRateHz = 384000; | 
|  |  | 
|  | }  // namespace | 
|  |  | 
|  | Agc::Agc() | 
|  | : target_level_loudness_(Dbfs2Loudness(kDefaultLevelDbfs)), | 
|  | target_level_dbfs_(kDefaultLevelDbfs), | 
|  | histogram_(LoudnessHistogram::Create(kNumAnalysisFrames)), | 
|  | inactive_histogram_(LoudnessHistogram::Create()) {} | 
|  |  | 
|  | Agc::~Agc() = default; | 
|  |  | 
|  | void Agc::Process(ArrayView<const int16_t> audio) { | 
|  | const int sample_rate_hz = audio.size() * kNum10msFramesInOneSecond; | 
|  | RTC_DCHECK_LE(sample_rate_hz, kMaxSampleRateHz); | 
|  | vad_.ProcessChunk(audio.data(), audio.size(), sample_rate_hz); | 
|  | const std::vector<double>& rms = vad_.chunkwise_rms(); | 
|  | const std::vector<double>& probabilities = | 
|  | vad_.chunkwise_voice_probabilities(); | 
|  | RTC_DCHECK_EQ(rms.size(), probabilities.size()); | 
|  | for (size_t i = 0; i < rms.size(); ++i) { | 
|  | histogram_->Update(rms[i], probabilities[i]); | 
|  | } | 
|  | } | 
|  |  | 
|  | bool Agc::GetRmsErrorDb(int* error) { | 
|  | if (!error) { | 
|  | RTC_DCHECK_NOTREACHED(); | 
|  | return false; | 
|  | } | 
|  |  | 
|  | if (histogram_->num_updates() < kNumAnalysisFrames) { | 
|  | // We haven't yet received enough frames. | 
|  | return false; | 
|  | } | 
|  |  | 
|  | if (histogram_->AudioContent() < kNumAnalysisFrames * kActivityThreshold) { | 
|  | // We are likely in an inactive segment. | 
|  | return false; | 
|  | } | 
|  |  | 
|  | double loudness = Linear2Loudness(histogram_->CurrentRms()); | 
|  | *error = std::floor(Loudness2Db(target_level_loudness_ - loudness) + 0.5); | 
|  | histogram_->Reset(); | 
|  | return true; | 
|  | } | 
|  |  | 
|  | void Agc::Reset() { | 
|  | histogram_->Reset(); | 
|  | } | 
|  |  | 
|  | int Agc::set_target_level_dbfs(int level) { | 
|  | // TODO(turajs): just some arbitrary sanity check. We can come up with better | 
|  | // limits. The upper limit should be chosen such that the risk of clipping is | 
|  | // low. The lower limit should not result in a too quiet signal. | 
|  | if (level >= 0 || level <= -100) | 
|  | return -1; | 
|  | target_level_dbfs_ = level; | 
|  | target_level_loudness_ = Dbfs2Loudness(level); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | int Agc::target_level_dbfs() const { | 
|  | return target_level_dbfs_; | 
|  | } | 
|  |  | 
|  | float Agc::voice_probability() const { | 
|  | return vad_.last_voice_probability(); | 
|  | } | 
|  |  | 
|  | }  // namespace webrtc |