/*
 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
 *
 * Use of this source code is governed by a BSD-style license
 * that can be found in the LICENSE file in the root of the source
 * tree. An additional intellectual property rights grant can be found
 * in the file PATENTS. All contributing project authors may
 * be found in the AUTHORS file in the root of the source tree.
 */

#ifndef MODULES_AUDIO_PROCESSING_NS_NOISE_SUPPRESSOR_H_
#define MODULES_AUDIO_PROCESSING_NS_NOISE_SUPPRESSOR_H_

#include <array>
#include <cstdint>
#include <memory>
#include <vector>

#include "api/array_view.h"
#include "modules/audio_processing/audio_buffer.h"
#include "modules/audio_processing/ns/noise_estimator.h"
#include "modules/audio_processing/ns/ns_common.h"
#include "modules/audio_processing/ns/ns_config.h"
#include "modules/audio_processing/ns/ns_fft.h"
#include "modules/audio_processing/ns/speech_probability_estimator.h"
#include "modules/audio_processing/ns/wiener_filter.h"

namespace webrtc {

// Class for suppressing noise in a signal.
class NoiseSuppressor {
 public:
  NoiseSuppressor(const NsConfig& config,
                  size_t sample_rate_hz,
                  size_t num_channels);

  NoiseSuppressor(const NoiseSuppressor&) = delete;
  NoiseSuppressor& operator=(const NoiseSuppressor&) = delete;

  // Analyzes the signal (typically applied before the AEC to avoid analyzing
  // any comfort noise signal).
  void Analyze(const AudioBuffer& audio);

  // Applies noise suppression.
  void Process(AudioBuffer* audio);

  // Specifies whether the capture output will be used. The purpose of this is
  // to allow the noise suppressor to deactivate some of the processing when
  // the resulting output is not used anyway, for instance when the endpoint
  // is muted.
  void SetCaptureOutputUsage(bool capture_output_used) {
    capture_output_used_ = capture_output_used;
  }

 private:
  const size_t num_bands_;
  const size_t num_channels_;
  const SuppressionParams suppression_params_;
  int32_t num_analyzed_frames_ = -1;
  NrFft fft_;
  bool capture_output_used_ = true;

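  // Per-channel state for the noise estimation and suppression pipeline (one
  // instance per capture channel).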
  struct ChannelState {
    ChannelState(const SuppressionParams& suppression_params, size_t num_bands);

    SpeechProbabilityEstimator speech_probability_estimator;
    WienerFilter wiener_filter;
    NoiseEstimator noise_estimator;
    std::array<float, kFftSizeBy2Plus1> prev_analysis_signal_spectrum;
    std::array<float, kFftSize - kNsFrameSize> analyze_analysis_memory;
    std::array<float, kOverlapSize> process_analysis_memory;
    std::array<float, kOverlapSize> process_synthesis_memory;
    std::vector<std::array<float, kOverlapSize>> process_delay_memory;
  };

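  // Time-domain (extended_frame) and frequency-domain (real/imag) scratch
  // buffers for the filter bank of a single channel.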
  struct FilterBankState {
    std::array<float, kFftSize> real;
    std::array<float, kFftSize> imag;
    std::array<float, kFftSize> extended_frame;
  };

  std::vector<FilterBankState> filter_bank_states_heap_;
  std::vector<float> upper_band_gains_heap_;
  std::vector<float> energies_before_filtering_heap_;
  std::vector<float> gain_adjustments_heap_;
  std::vector<std::unique_ptr<ChannelState>> channels_;

  // Aggregates the Wiener filters into a single filter to use.
  void AggregateWienerFilters(
      rtc::ArrayView<float, kFftSizeBy2Plus1> filter) const;
};
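
// A minimal usage sketch of the interface above (illustrative only; the
// 48 kHz mono configuration and the per-frame capture loop are assumptions
// about the surrounding pipeline, not guarantees made by this header):
//
//   NsConfig config;  // Defaults from ns_config.h.
//   NoiseSuppressor ns(config, /*sample_rate_hz=*/48000, /*num_channels=*/1);
//
//   // For every capture frame held in an AudioBuffer `capture`:
//   ns.Analyze(capture);   // Before the AEC, so that injected comfort noise
//                          // is not analyzed as background noise.
//   // ... echo cancellation runs here ...
//   ns.Process(&capture);  // Applies the suppression in place.
//
//   // Optionally reduce the work done when the capture output is unused,
//   // e.g. while the endpoint is muted:
//   ns.SetCaptureOutputUsage(/*capture_output_used=*/false);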
}  // namespace webrtc

#endif  // MODULES_AUDIO_PROCESSING_NS_NOISE_SUPPRESSOR_H_