| /* |
| * Copyright (c) 2018 The WebRTC project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| #ifndef API_AUDIO_ECHO_CANCELLER3_CONFIG_H_ |
| #define API_AUDIO_ECHO_CANCELLER3_CONFIG_H_ |
| |
| #include <stddef.h> // size_t |
| |
| #include "rtc_base/system/rtc_export.h" |
| |
| namespace webrtc { |
| |
| // Configuration struct for EchoCanceller3 |
| struct RTC_EXPORT EchoCanceller3Config { |
| // Checks and updates the config parameters to lie within (mostly) reasonable |
| // ranges. Returns true if and only of the config did not need to be changed. |
| static bool Validate(EchoCanceller3Config* config); |
| |
| EchoCanceller3Config(); |
| EchoCanceller3Config(const EchoCanceller3Config& e); |
| EchoCanceller3Config& operator=(const EchoCanceller3Config& other); |
| |
| struct Buffering { |
| size_t excess_render_detection_interval_blocks = 250; |
| size_t max_allowed_excess_render_blocks = 8; |
| } buffering; |
| |
| struct Delay { |
| Delay(); |
| Delay(const Delay& e); |
| Delay& operator=(const Delay& e); |
| size_t default_delay = 5; |
| size_t down_sampling_factor = 4; |
| size_t num_filters = 5; |
| size_t delay_headroom_samples = 32; |
| size_t hysteresis_limit_blocks = 1; |
| size_t fixed_capture_delay_samples = 0; |
| float delay_estimate_smoothing = 0.7f; |
| float delay_estimate_smoothing_delay_found = 0.7f; |
| float delay_candidate_detection_threshold = 0.2f; |
| struct DelaySelectionThresholds { |
| int initial; |
| int converged; |
| } delay_selection_thresholds = {5, 20}; |
| bool use_external_delay_estimator = false; |
| bool log_warning_on_delay_changes = false; |
| struct AlignmentMixing { |
| bool downmix; |
| bool adaptive_selection; |
| float activity_power_threshold; |
| bool prefer_first_two_channels; |
| }; |
| AlignmentMixing render_alignment_mixing = {false, true, 10000.f, true}; |
| AlignmentMixing capture_alignment_mixing = {false, true, 10000.f, false}; |
| bool detect_pre_echo = true; |
| } delay; |
| |
| struct Filter { |
| struct RefinedConfiguration { |
| size_t length_blocks; |
| float leakage_converged; |
| float leakage_diverged; |
| float error_floor; |
| float error_ceil; |
| float noise_gate; |
| }; |
| |
| struct CoarseConfiguration { |
| size_t length_blocks; |
| float rate; |
| float noise_gate; |
| }; |
| |
| RefinedConfiguration refined = {13, 0.00005f, 0.05f, |
| 0.001f, 2.f, 20075344.f}; |
| CoarseConfiguration coarse = {13, 0.7f, 20075344.f}; |
| |
| RefinedConfiguration refined_initial = {12, 0.005f, 0.5f, |
| 0.001f, 2.f, 20075344.f}; |
| CoarseConfiguration coarse_initial = {12, 0.9f, 20075344.f}; |
| |
| size_t config_change_duration_blocks = 250; |
| float initial_state_seconds = 2.5f; |
| int coarse_reset_hangover_blocks = 25; |
| bool conservative_initial_phase = false; |
| bool enable_coarse_filter_output_usage = true; |
| bool use_linear_filter = true; |
| bool high_pass_filter_echo_reference = false; |
| bool export_linear_aec_output = false; |
| } filter; |
| |
| struct Erle { |
| float min = 1.f; |
| float max_l = 4.f; |
| float max_h = 1.5f; |
| bool onset_detection = true; |
| size_t num_sections = 1; |
| bool clamp_quality_estimate_to_zero = true; |
| bool clamp_quality_estimate_to_one = true; |
| } erle; |
| |
| struct EpStrength { |
| float default_gain = 1.f; |
| float default_len = 0.83f; |
| float nearend_len = 0.83f; |
| bool echo_can_saturate = true; |
| bool bounded_erl = false; |
| bool erle_onset_compensation_in_dominant_nearend = false; |
| bool use_conservative_tail_frequency_response = true; |
| } ep_strength; |
| |
| struct EchoAudibility { |
| float low_render_limit = 4 * 64.f; |
| float normal_render_limit = 64.f; |
| float floor_power = 2 * 64.f; |
| float audibility_threshold_lf = 10; |
| float audibility_threshold_mf = 10; |
| float audibility_threshold_hf = 10; |
| bool use_stationarity_properties = false; |
| bool use_stationarity_properties_at_init = false; |
| } echo_audibility; |
| |
| struct RenderLevels { |
| float active_render_limit = 100.f; |
| float poor_excitation_render_limit = 150.f; |
| float poor_excitation_render_limit_ds8 = 20.f; |
| float render_power_gain_db = 0.f; |
| } render_levels; |
| |
| struct EchoRemovalControl { |
| bool has_clock_drift = false; |
| bool linear_and_stable_echo_path = false; |
| } echo_removal_control; |
| |
| struct EchoModel { |
| EchoModel(); |
| EchoModel(const EchoModel& e); |
| EchoModel& operator=(const EchoModel& e); |
| size_t noise_floor_hold = 50; |
| float min_noise_floor_power = 1638400.f; |
| float stationary_gate_slope = 10.f; |
| float noise_gate_power = 27509.42f; |
| float noise_gate_slope = 0.3f; |
| size_t render_pre_window_size = 1; |
| size_t render_post_window_size = 1; |
| bool model_reverb_in_nonlinear_mode = true; |
| } echo_model; |
| |
| struct ComfortNoise { |
| float noise_floor_dbfs = -96.03406f; |
| } comfort_noise; |
| |
| struct Suppressor { |
| Suppressor(); |
| Suppressor(const Suppressor& e); |
| Suppressor& operator=(const Suppressor& e); |
| |
| size_t nearend_average_blocks = 4; |
| |
| struct MaskingThresholds { |
| MaskingThresholds(float enr_transparent, |
| float enr_suppress, |
| float emr_transparent); |
| MaskingThresholds(const MaskingThresholds& e); |
| MaskingThresholds& operator=(const MaskingThresholds& e); |
| float enr_transparent; |
| float enr_suppress; |
| float emr_transparent; |
| }; |
| |
| struct Tuning { |
| Tuning(MaskingThresholds mask_lf, |
| MaskingThresholds mask_hf, |
| float max_inc_factor, |
| float max_dec_factor_lf); |
| Tuning(const Tuning& e); |
| Tuning& operator=(const Tuning& e); |
| MaskingThresholds mask_lf; |
| MaskingThresholds mask_hf; |
| float max_inc_factor; |
| float max_dec_factor_lf; |
| }; |
| |
| Tuning normal_tuning = Tuning(MaskingThresholds(.3f, .4f, .3f), |
| MaskingThresholds(.07f, .1f, .3f), |
| 2.0f, |
| 0.25f); |
| Tuning nearend_tuning = Tuning(MaskingThresholds(1.09f, 1.1f, .3f), |
| MaskingThresholds(.1f, .3f, .3f), |
| 2.0f, |
| 0.25f); |
| |
| bool lf_smoothing_during_initial_phase = true; |
| int last_permanent_lf_smoothing_band = 0; |
| int last_lf_smoothing_band = 5; |
| int last_lf_band = 5; |
| int first_hf_band = 8; |
| |
| struct DominantNearendDetection { |
| float enr_threshold = .25f; |
| float enr_exit_threshold = 10.f; |
| float snr_threshold = 30.f; |
| int hold_duration = 50; |
| int trigger_threshold = 12; |
| bool use_during_initial_phase = true; |
| bool use_unbounded_echo_spectrum = true; |
| } dominant_nearend_detection; |
| |
| struct SubbandNearendDetection { |
| size_t nearend_average_blocks = 1; |
| struct SubbandRegion { |
| size_t low; |
| size_t high; |
| }; |
| SubbandRegion subband1 = {1, 1}; |
| SubbandRegion subband2 = {1, 1}; |
| float nearend_threshold = 1.f; |
| float snr_threshold = 1.f; |
| } subband_nearend_detection; |
| |
| bool use_subband_nearend_detection = false; |
| |
| struct HighBandsSuppression { |
| float enr_threshold = 1.f; |
| float max_gain_during_echo = 1.f; |
| float anti_howling_activation_threshold = 400.f; |
| float anti_howling_gain = 1.f; |
| } high_bands_suppression; |
| |
| float floor_first_increase = 0.00001f; |
| bool conservative_hf_suppression = false; |
| } suppressor; |
| |
| struct MultiChannel { |
| bool detect_stereo_content = true; |
| float stereo_detection_threshold = 0.0f; |
| int stereo_detection_timeout_threshold_seconds = 300; |
| float stereo_detection_hysteresis_seconds = 2.0f; |
| } multi_channel; |
| }; |
| } // namespace webrtc |
| |
| #endif // API_AUDIO_ECHO_CANCELLER3_CONFIG_H_ |