modules/audio_processing/agc2/speech_level_estimator.h - src/ - Git at Google

 /*
  *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #ifndef MODULES_AUDIO_PROCESSING_AGC2_SPEECH_LEVEL_ESTIMATOR_H_
 #define MODULES_AUDIO_PROCESSING_AGC2_SPEECH_LEVEL_ESTIMATOR_H_

 #include <stddef.h>

 #include <type_traits>

 #include "modules/audio_processing/agc2/agc2_common.h"
 #include "modules/audio_processing/include/audio_processing.h"

 namespace webrtc {
 // Forward declaration: this header only refers to `ApmDataDumper` through
 // pointers, so the full class definition is not required here.
 class ApmDataDumper;

 // Estimator of the active speech level. It is driven with the following
 // framewise properties: RMS level (dBFS), peak level (dBFS) and speech
 // probability.
 class SpeechLevelEstimator {
  public:
   SpeechLevelEstimator(
       ApmDataDumper* apm_data_dumper,
       const AudioProcessing::Config::GainController2::AdaptiveDigital& config,
       int adjacent_speech_frames_threshold);
   // Copy construction and copy assignment are disabled.
   SpeechLevelEstimator(const SpeechLevelEstimator&) = delete;
   SpeechLevelEstimator& operator=(const SpeechLevelEstimator&) = delete;

   // Updates the level estimation from the given frame properties.
   void Update(float rms_dbfs, float peak_dbfs, float speech_probability);

   // Accessor for the estimated speech plus noise level.
   float level_dbfs() const { return level_dbfs_; }

   // Tells whether the estimator is confident about its current estimate.
   bool is_confident() const { return is_confident_; }

   // Declared here, defined out of line.
   void Reset();

  private:
   // Subset of the estimator state that is check-pointed and restored.
   struct LevelEstimatorState {
     // Numerator/denominator pair; `GetRatio()` is defined out of line.
     struct Ratio {
       float numerator;
       float denominator;
       float GetRatio() const;
     };

     bool operator==(const LevelEstimatorState& other) const;
     // Defined as the negation of `operator==`.
     bool operator!=(const LevelEstimatorState& other) const {
       return !operator==(other);
     }

     // TODO(bugs.webrtc.org/7494): Remove `time_to_confidence_ms` if redundant.
     int time_to_confidence_ms;
     Ratio level_dbfs;
   };
   // Compile-time guard: the state must remain trivially copyable.
   static_assert(std::is_trivially_copyable<LevelEstimatorState>::value, "");

   // Private helpers; all of them are defined out of line.
   void UpdateIsConfident();
   void ResetLevelEstimatorState(LevelEstimatorState& state) const;
   void DumpDebugData() const;

   // The pointer itself is const and cannot be re-seated after construction.
   ApmDataDumper* const apm_data_dumper_;

   // Immutable after construction.
   const float initial_speech_level_dbfs_;
   const int adjacent_speech_frames_threshold_;

   // Two instances of the check-pointable state.
   LevelEstimatorState preliminary_state_;
   LevelEstimatorState reliable_state_;

   // Values exposed through `level_dbfs()` and `is_confident()`.
   float level_dbfs_;
   bool is_confident_;

   int num_adjacent_speech_frames_;
 };

 }  // namespace webrtc

 #endif  // MODULES_AUDIO_PROCESSING_AGC2_SPEECH_LEVEL_ESTIMATOR_H_
	/*
	* Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#ifndef MODULES_AUDIO_PROCESSING_AGC2_SPEECH_LEVEL_ESTIMATOR_H_
	#define MODULES_AUDIO_PROCESSING_AGC2_SPEECH_LEVEL_ESTIMATOR_H_

	#include <stddef.h>

	#include <type_traits>

	#include "modules/audio_processing/agc2/agc2_common.h"
	#include "modules/audio_processing/include/audio_processing.h"

	namespace webrtc {
	// Forward declaration: this header only refers to `ApmDataDumper` through
	// pointers, so the full class definition is not required here.
	class ApmDataDumper;

	// Estimator of the active speech level. It is driven with the following
	// framewise properties: RMS level (dBFS), peak level (dBFS) and speech
	// probability.
	class SpeechLevelEstimator {
	 public:
	  SpeechLevelEstimator(
	      ApmDataDumper* apm_data_dumper,
	      const AudioProcessing::Config::GainController2::AdaptiveDigital& config,
	      int adjacent_speech_frames_threshold);
	  // Copy construction and copy assignment are disabled.
	  SpeechLevelEstimator(const SpeechLevelEstimator&) = delete;
	  SpeechLevelEstimator& operator=(const SpeechLevelEstimator&) = delete;

	  // Updates the level estimation from the given frame properties.
	  void Update(float rms_dbfs, float peak_dbfs, float speech_probability);

	  // Accessor for the estimated speech plus noise level.
	  float level_dbfs() const { return level_dbfs_; }

	  // Tells whether the estimator is confident about its current estimate.
	  bool is_confident() const { return is_confident_; }

	  // Declared here, defined out of line.
	  void Reset();

	 private:
	  // Subset of the estimator state that is check-pointed and restored.
	  struct LevelEstimatorState {
	    // Numerator/denominator pair; `GetRatio()` is defined out of line.
	    struct Ratio {
	      float numerator;
	      float denominator;
	      float GetRatio() const;
	    };

	    bool operator==(const LevelEstimatorState& other) const;
	    // Defined as the negation of `operator==`.
	    bool operator!=(const LevelEstimatorState& other) const {
	      return !operator==(other);
	    }

	    // TODO(bugs.webrtc.org/7494): Remove `time_to_confidence_ms` if redundant.
	    int time_to_confidence_ms;
	    Ratio level_dbfs;
	  };
	  // Compile-time guard: the state must remain trivially copyable.
	  static_assert(std::is_trivially_copyable<LevelEstimatorState>::value, "");

	  // Private helpers; all of them are defined out of line.
	  void UpdateIsConfident();
	  void ResetLevelEstimatorState(LevelEstimatorState& state) const;
	  void DumpDebugData() const;

	  // The pointer itself is const and cannot be re-seated after construction.
	  ApmDataDumper* const apm_data_dumper_;

	  // Immutable after construction.
	  const float initial_speech_level_dbfs_;
	  const int adjacent_speech_frames_threshold_;

	  // Two instances of the check-pointable state.
	  LevelEstimatorState preliminary_state_;
	  LevelEstimatorState reliable_state_;

	  // Values exposed through `level_dbfs()` and `is_confident()`.
	  float level_dbfs_;
	  bool is_confident_;

	  int num_adjacent_speech_frames_;
	};

	} // namespace webrtc

	#endif // MODULES_AUDIO_PROCESSING_AGC2_SPEECH_LEVEL_ESTIMATOR_H_