api/audio/echo_canceller3_config.h - src/ - Git at Google

 /*
  *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #ifndef API_AUDIO_ECHO_CANCELLER3_CONFIG_H_
 #define API_AUDIO_ECHO_CANCELLER3_CONFIG_H_

 #include <stddef.h>  // size_t

 #include "rtc_base/system/rtc_export.h"

 namespace webrtc {

 // Configuration struct for EchoCanceller3
 struct RTC_EXPORT EchoCanceller3Config {
   // Checks and updates the config parameters to lie within (mostly) reasonable
   // ranges. Returns true if and only of the config did not need to be changed.
   static bool Validate(EchoCanceller3Config* config);

   EchoCanceller3Config();
   EchoCanceller3Config(const EchoCanceller3Config& e);
   EchoCanceller3Config& operator=(const EchoCanceller3Config& other);

   struct Buffering {
     size_t excess_render_detection_interval_blocks = 250;
     size_t max_allowed_excess_render_blocks = 8;
   } buffering;

   struct Delay {
     Delay();
     Delay(const Delay& e);
     Delay& operator=(const Delay& e);
     size_t default_delay = 5;
     size_t down_sampling_factor = 4;
     size_t num_filters = 5;
     size_t delay_headroom_samples = 32;
     size_t hysteresis_limit_blocks = 1;
     size_t fixed_capture_delay_samples = 0;
     float delay_estimate_smoothing = 0.7f;
     float delay_estimate_smoothing_delay_found = 0.7f;
     float delay_candidate_detection_threshold = 0.2f;
     struct DelaySelectionThresholds {
       int initial;
       int converged;
     } delay_selection_thresholds = {5, 20};
     bool use_external_delay_estimator = false;
     bool log_warning_on_delay_changes = false;
     struct AlignmentMixing {
       bool downmix;
       bool adaptive_selection;
       float activity_power_threshold;
       bool prefer_first_two_channels;
     };
     AlignmentMixing render_alignment_mixing = {false, true, 10000.f, true};
     AlignmentMixing capture_alignment_mixing = {false, true, 10000.f, false};
     bool detect_pre_echo = true;
   } delay;

   struct Filter {
     struct RefinedConfiguration {
       size_t length_blocks;
       float leakage_converged;
       float leakage_diverged;
       float error_floor;
       float error_ceil;
       float noise_gate;
     };

     struct CoarseConfiguration {
       size_t length_blocks;
       float rate;
       float noise_gate;
     };

     RefinedConfiguration refined = {13,     0.00005f, 0.05f,
                                     0.001f, 2.f,      20075344.f};
     CoarseConfiguration coarse = {13, 0.7f, 20075344.f};

     RefinedConfiguration refined_initial = {12,     0.005f, 0.5f,
                                             0.001f, 2.f,    20075344.f};
     CoarseConfiguration coarse_initial = {12, 0.9f, 20075344.f};

     size_t config_change_duration_blocks = 250;
     float initial_state_seconds = 2.5f;
     int coarse_reset_hangover_blocks = 25;
     bool conservative_initial_phase = false;
     bool enable_coarse_filter_output_usage = true;
     bool use_linear_filter = true;
     bool high_pass_filter_echo_reference = false;
     bool export_linear_aec_output = false;
   } filter;

   struct Erle {
     float min = 1.f;
     float max_l = 4.f;
     float max_h = 1.5f;
     bool onset_detection = true;
     size_t num_sections = 1;
     bool clamp_quality_estimate_to_zero = true;
     bool clamp_quality_estimate_to_one = true;
   } erle;

   struct EpStrength {
     float default_gain = 1.f;
     float default_len = 0.83f;
     float nearend_len = 0.83f;
     bool echo_can_saturate = true;
     bool bounded_erl = false;
     bool erle_onset_compensation_in_dominant_nearend = false;
     bool use_conservative_tail_frequency_response = true;
   } ep_strength;

   struct EchoAudibility {
     float low_render_limit = 4 * 64.f;
     float normal_render_limit = 64.f;
     float floor_power = 2 * 64.f;
     float audibility_threshold_lf = 10;
     float audibility_threshold_mf = 10;
     float audibility_threshold_hf = 10;
     bool use_stationarity_properties = false;
     bool use_stationarity_properties_at_init = false;
   } echo_audibility;

   struct RenderLevels {
     float active_render_limit = 100.f;
     float poor_excitation_render_limit = 150.f;
     float poor_excitation_render_limit_ds8 = 20.f;
     float render_power_gain_db = 0.f;
   } render_levels;

   struct EchoRemovalControl {
     bool has_clock_drift = false;
     bool linear_and_stable_echo_path = false;
   } echo_removal_control;

   struct EchoModel {
     EchoModel();
     EchoModel(const EchoModel& e);
     EchoModel& operator=(const EchoModel& e);
     size_t noise_floor_hold = 50;
     float min_noise_floor_power = 1638400.f;
     float stationary_gate_slope = 10.f;
     float noise_gate_power = 27509.42f;
     float noise_gate_slope = 0.3f;
     size_t render_pre_window_size = 1;
     size_t render_post_window_size = 1;
     bool model_reverb_in_nonlinear_mode = true;
   } echo_model;

   struct ComfortNoise {
     float noise_floor_dbfs = -96.03406f;
   } comfort_noise;

   struct Suppressor {
     Suppressor();
     Suppressor(const Suppressor& e);
     Suppressor& operator=(const Suppressor& e);

     size_t nearend_average_blocks = 4;

     struct MaskingThresholds {
       MaskingThresholds(float enr_transparent,
                         float enr_suppress,
                         float emr_transparent);
       MaskingThresholds(const MaskingThresholds& e);
       MaskingThresholds& operator=(const MaskingThresholds& e);
       float enr_transparent;
       float enr_suppress;
       float emr_transparent;
     };

     struct Tuning {
       Tuning(MaskingThresholds mask_lf,
              MaskingThresholds mask_hf,
              float max_inc_factor,
              float max_dec_factor_lf);
       Tuning(const Tuning& e);
       Tuning& operator=(const Tuning& e);
       MaskingThresholds mask_lf;
       MaskingThresholds mask_hf;
       float max_inc_factor;
       float max_dec_factor_lf;
     };

     Tuning normal_tuning = Tuning(MaskingThresholds(.3f, .4f, .3f),
                                   MaskingThresholds(.07f, .1f, .3f),
                                   2.0f,
                                   0.25f);
     Tuning nearend_tuning = Tuning(MaskingThresholds(1.09f, 1.1f, .3f),
                                    MaskingThresholds(.1f, .3f, .3f),
                                    2.0f,
                                    0.25f);

     bool lf_smoothing_during_initial_phase = true;
     int last_permanent_lf_smoothing_band = 0;
     int last_lf_smoothing_band = 5;
     int last_lf_band = 5;
     int first_hf_band = 8;

     struct DominantNearendDetection {
       float enr_threshold = .25f;
       float enr_exit_threshold = 10.f;
       float snr_threshold = 30.f;
       int hold_duration = 50;
       int trigger_threshold = 12;
       bool use_during_initial_phase = true;
       bool use_unbounded_echo_spectrum = true;
     } dominant_nearend_detection;

     struct SubbandNearendDetection {
       size_t nearend_average_blocks = 1;
       struct SubbandRegion {
         size_t low;
         size_t high;
       };
       SubbandRegion subband1 = {1, 1};
       SubbandRegion subband2 = {1, 1};
       float nearend_threshold = 1.f;
       float snr_threshold = 1.f;
     } subband_nearend_detection;

     bool use_subband_nearend_detection = false;

     struct HighBandsSuppression {
       float enr_threshold = 1.f;
       float max_gain_during_echo = 1.f;
       float anti_howling_activation_threshold = 400.f;
       float anti_howling_gain = 1.f;
     } high_bands_suppression;

     float floor_first_increase = 0.00001f;
     bool conservative_hf_suppression = false;
   } suppressor;

   struct MultiChannel {
     bool detect_stereo_content = true;
     float stereo_detection_threshold = 0.0f;
     int stereo_detection_timeout_threshold_seconds = 300;
     float stereo_detection_hysteresis_seconds = 2.0f;
   } multi_channel;
 };
 }  // namespace webrtc

 #endif  // API_AUDIO_ECHO_CANCELLER3_CONFIG_H_
	/*
	* Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#ifndef API_AUDIO_ECHO_CANCELLER3_CONFIG_H_
	#define API_AUDIO_ECHO_CANCELLER3_CONFIG_H_

	#include <stddef.h> // size_t

	#include "rtc_base/system/rtc_export.h"

	namespace webrtc {

	// Configuration struct for EchoCanceller3
	struct RTC_EXPORT EchoCanceller3Config {
	// Checks and updates the config parameters to lie within (mostly) reasonable
	// ranges. Returns true if and only of the config did not need to be changed.
	static bool Validate(EchoCanceller3Config* config);

	EchoCanceller3Config();
	EchoCanceller3Config(const EchoCanceller3Config& e);
	EchoCanceller3Config& operator=(const EchoCanceller3Config& other);

	struct Buffering {
	size_t excess_render_detection_interval_blocks = 250;
	size_t max_allowed_excess_render_blocks = 8;
	} buffering;

	struct Delay {
	Delay();
	Delay(const Delay& e);
	Delay& operator=(const Delay& e);
	size_t default_delay = 5;
	size_t down_sampling_factor = 4;
	size_t num_filters = 5;
	size_t delay_headroom_samples = 32;
	size_t hysteresis_limit_blocks = 1;
	size_t fixed_capture_delay_samples = 0;
	float delay_estimate_smoothing = 0.7f;
	float delay_estimate_smoothing_delay_found = 0.7f;
	float delay_candidate_detection_threshold = 0.2f;
	struct DelaySelectionThresholds {
	int initial;
	int converged;
	} delay_selection_thresholds = {5, 20};
	bool use_external_delay_estimator = false;
	bool log_warning_on_delay_changes = false;
	struct AlignmentMixing {
	bool downmix;
	bool adaptive_selection;
	float activity_power_threshold;
	bool prefer_first_two_channels;
	};
	AlignmentMixing render_alignment_mixing = {false, true, 10000.f, true};
	AlignmentMixing capture_alignment_mixing = {false, true, 10000.f, false};
	bool detect_pre_echo = true;
	} delay;

	struct Filter {
	struct RefinedConfiguration {
	size_t length_blocks;
	float leakage_converged;
	float leakage_diverged;
	float error_floor;
	float error_ceil;
	float noise_gate;
	};

	struct CoarseConfiguration {
	size_t length_blocks;
	float rate;
	float noise_gate;
	};

	RefinedConfiguration refined = {13, 0.00005f, 0.05f,
	0.001f, 2.f, 20075344.f};
	CoarseConfiguration coarse = {13, 0.7f, 20075344.f};

	RefinedConfiguration refined_initial = {12, 0.005f, 0.5f,
	0.001f, 2.f, 20075344.f};
	CoarseConfiguration coarse_initial = {12, 0.9f, 20075344.f};

	size_t config_change_duration_blocks = 250;
	float initial_state_seconds = 2.5f;
	int coarse_reset_hangover_blocks = 25;
	bool conservative_initial_phase = false;
	bool enable_coarse_filter_output_usage = true;
	bool use_linear_filter = true;
	bool high_pass_filter_echo_reference = false;
	bool export_linear_aec_output = false;
	} filter;

	struct Erle {
	float min = 1.f;
	float max_l = 4.f;
	float max_h = 1.5f;
	bool onset_detection = true;
	size_t num_sections = 1;
	bool clamp_quality_estimate_to_zero = true;
	bool clamp_quality_estimate_to_one = true;
	} erle;

	struct EpStrength {
	float default_gain = 1.f;
	float default_len = 0.83f;
	float nearend_len = 0.83f;
	bool echo_can_saturate = true;
	bool bounded_erl = false;
	bool erle_onset_compensation_in_dominant_nearend = false;
	bool use_conservative_tail_frequency_response = true;
	} ep_strength;

	struct EchoAudibility {
	float low_render_limit = 4 * 64.f;
	float normal_render_limit = 64.f;
	float floor_power = 2 * 64.f;
	float audibility_threshold_lf = 10;
	float audibility_threshold_mf = 10;
	float audibility_threshold_hf = 10;
	bool use_stationarity_properties = false;
	bool use_stationarity_properties_at_init = false;
	} echo_audibility;

	struct RenderLevels {
	float active_render_limit = 100.f;
	float poor_excitation_render_limit = 150.f;
	float poor_excitation_render_limit_ds8 = 20.f;
	float render_power_gain_db = 0.f;
	} render_levels;

	struct EchoRemovalControl {
	bool has_clock_drift = false;
	bool linear_and_stable_echo_path = false;
	} echo_removal_control;

	struct EchoModel {
	EchoModel();
	EchoModel(const EchoModel& e);
	EchoModel& operator=(const EchoModel& e);
	size_t noise_floor_hold = 50;
	float min_noise_floor_power = 1638400.f;
	float stationary_gate_slope = 10.f;
	float noise_gate_power = 27509.42f;
	float noise_gate_slope = 0.3f;
	size_t render_pre_window_size = 1;
	size_t render_post_window_size = 1;
	bool model_reverb_in_nonlinear_mode = true;
	} echo_model;

	struct ComfortNoise {
	float noise_floor_dbfs = -96.03406f;
	} comfort_noise;

	struct Suppressor {
	Suppressor();
	Suppressor(const Suppressor& e);
	Suppressor& operator=(const Suppressor& e);

	size_t nearend_average_blocks = 4;

	struct MaskingThresholds {
	MaskingThresholds(float enr_transparent,
	float enr_suppress,
	float emr_transparent);
	MaskingThresholds(const MaskingThresholds& e);
	MaskingThresholds& operator=(const MaskingThresholds& e);
	float enr_transparent;
	float enr_suppress;
	float emr_transparent;
	};

	struct Tuning {
	Tuning(MaskingThresholds mask_lf,
	MaskingThresholds mask_hf,
	float max_inc_factor,
	float max_dec_factor_lf);
	Tuning(const Tuning& e);
	Tuning& operator=(const Tuning& e);
	MaskingThresholds mask_lf;
	MaskingThresholds mask_hf;
	float max_inc_factor;
	float max_dec_factor_lf;
	};

	Tuning normal_tuning = Tuning(MaskingThresholds(.3f, .4f, .3f),
	MaskingThresholds(.07f, .1f, .3f),
	2.0f,
	0.25f);
	Tuning nearend_tuning = Tuning(MaskingThresholds(1.09f, 1.1f, .3f),
	MaskingThresholds(.1f, .3f, .3f),
	2.0f,
	0.25f);

	bool lf_smoothing_during_initial_phase = true;
	int last_permanent_lf_smoothing_band = 0;
	int last_lf_smoothing_band = 5;
	int last_lf_band = 5;
	int first_hf_band = 8;

	struct DominantNearendDetection {
	float enr_threshold = .25f;
	float enr_exit_threshold = 10.f;
	float snr_threshold = 30.f;
	int hold_duration = 50;
	int trigger_threshold = 12;
	bool use_during_initial_phase = true;
	bool use_unbounded_echo_spectrum = true;
	} dominant_nearend_detection;

	struct SubbandNearendDetection {
	size_t nearend_average_blocks = 1;
	struct SubbandRegion {
	size_t low;
	size_t high;
	};
	SubbandRegion subband1 = {1, 1};
	SubbandRegion subband2 = {1, 1};
	float nearend_threshold = 1.f;
	float snr_threshold = 1.f;
	} subband_nearend_detection;

	bool use_subband_nearend_detection = false;

	struct HighBandsSuppression {
	float enr_threshold = 1.f;
	float max_gain_during_echo = 1.f;
	float anti_howling_activation_threshold = 400.f;
	float anti_howling_gain = 1.f;
	} high_bands_suppression;

	float floor_first_increase = 0.00001f;
	bool conservative_hf_suppression = false;
	} suppressor;

	struct MultiChannel {
	bool detect_stereo_content = true;
	float stereo_detection_threshold = 0.0f;
	int stereo_detection_timeout_threshold_seconds = 300;
	float stereo_detection_hysteresis_seconds = 2.0f;
	} multi_channel;
	};
	} // namespace webrtc

	#endif // API_AUDIO_ECHO_CANCELLER3_CONFIG_H_