/* * Copyright (c) 2018 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #ifndef API_AUDIO_ECHO_CANCELLER3_CONFIG_H_ #define API_AUDIO_ECHO_CANCELLER3_CONFIG_H_ #include // size_t #include "rtc_base/system/rtc_export.h" namespace webrtc { // Configuration struct for EchoCanceller3 struct RTC_EXPORT EchoCanceller3Config { // Checks and updates the config parameters to lie within (mostly) reasonable // ranges. Returns true if and only of the config did not need to be changed. static bool Validate(EchoCanceller3Config* config); EchoCanceller3Config(); EchoCanceller3Config(const EchoCanceller3Config& e); EchoCanceller3Config& operator=(const EchoCanceller3Config& other); struct Buffering { size_t excess_render_detection_interval_blocks = 250; size_t max_allowed_excess_render_blocks = 8; } buffering; struct Delay { Delay(); Delay(const Delay& e); Delay& operator=(const Delay& e); size_t default_delay = 5; size_t down_sampling_factor = 4; size_t num_filters = 5; size_t delay_headroom_samples = 32; size_t hysteresis_limit_blocks = 1; size_t fixed_capture_delay_samples = 0; float delay_estimate_smoothing = 0.7f; float delay_candidate_detection_threshold = 0.2f; struct DelaySelectionThresholds { int initial; int converged; } delay_selection_thresholds = {5, 20}; bool use_external_delay_estimator = false; bool log_warning_on_delay_changes = false; struct AlignmentMixing { bool downmix; bool adaptive_selection; float activity_power_threshold; bool prefer_first_two_channels; }; AlignmentMixing render_alignment_mixing = {false, true, 10000.f, true}; AlignmentMixing capture_alignment_mixing = {false, true, 10000.f, false}; } delay; struct Filter { struct RefinedConfiguration { size_t length_blocks; float leakage_converged; float leakage_diverged; float error_floor; float error_ceil; float noise_gate; }; struct CoarseConfiguration { size_t length_blocks; float rate; float noise_gate; }; RefinedConfiguration refined = {13, 0.00005f, 0.05f, 0.001f, 2.f, 20075344.f}; CoarseConfiguration coarse = {13, 0.7f, 20075344.f}; RefinedConfiguration refined_initial = {12, 0.005f, 0.5f, 0.001f, 2.f, 20075344.f}; CoarseConfiguration coarse_initial = {12, 0.9f, 20075344.f}; size_t config_change_duration_blocks = 250; float initial_state_seconds = 2.5f; bool conservative_initial_phase = false; bool enable_coarse_filter_output_usage = true; bool use_linear_filter = true; bool export_linear_aec_output = false; } filter; struct Erle { float min = 1.f; float max_l = 4.f; float max_h = 1.5f; bool onset_detection = true; size_t num_sections = 1; bool clamp_quality_estimate_to_zero = true; bool clamp_quality_estimate_to_one = true; } erle; struct EpStrength { float default_gain = 1.f; float default_len = 0.83f; bool echo_can_saturate = true; bool bounded_erl = false; } ep_strength; struct EchoAudibility { float low_render_limit = 4 * 64.f; float normal_render_limit = 64.f; float floor_power = 2 * 64.f; float audibility_threshold_lf = 10; float audibility_threshold_mf = 10; float audibility_threshold_hf = 10; bool use_stationarity_properties = false; bool use_stationarity_properties_at_init = false; } echo_audibility; struct RenderLevels { float active_render_limit = 100.f; float poor_excitation_render_limit = 150.f; float poor_excitation_render_limit_ds8 = 20.f; float render_power_gain_db = 0.f; } render_levels; struct EchoRemovalControl { bool has_clock_drift = false; bool linear_and_stable_echo_path = false; } echo_removal_control; struct EchoModel { EchoModel(); EchoModel(const EchoModel& e); EchoModel& operator=(const EchoModel& e); size_t noise_floor_hold = 50; float min_noise_floor_power = 1638400.f; float stationary_gate_slope = 10.f; float noise_gate_power = 27509.42f; float noise_gate_slope = 0.3f; size_t render_pre_window_size = 1; size_t render_post_window_size = 1; } echo_model; struct ComfortNoise { float noise_floor_dbfs = -96.03406f; } comfort_noise; struct Suppressor { Suppressor(); Suppressor(const Suppressor& e); Suppressor& operator=(const Suppressor& e); size_t nearend_average_blocks = 4; struct MaskingThresholds { MaskingThresholds(float enr_transparent, float enr_suppress, float emr_transparent); MaskingThresholds(const MaskingThresholds& e); MaskingThresholds& operator=(const MaskingThresholds& e); float enr_transparent; float enr_suppress; float emr_transparent; }; struct Tuning { Tuning(MaskingThresholds mask_lf, MaskingThresholds mask_hf, float max_inc_factor, float max_dec_factor_lf); Tuning(const Tuning& e); Tuning& operator=(const Tuning& e); MaskingThresholds mask_lf; MaskingThresholds mask_hf; float max_inc_factor; float max_dec_factor_lf; }; Tuning normal_tuning = Tuning(MaskingThresholds(.3f, .4f, .3f), MaskingThresholds(.07f, .1f, .3f), 2.0f, 0.25f); Tuning nearend_tuning = Tuning(MaskingThresholds(1.09f, 1.1f, .3f), MaskingThresholds(.1f, .3f, .3f), 2.0f, 0.25f); struct DominantNearendDetection { float enr_threshold = .25f; float enr_exit_threshold = 10.f; float snr_threshold = 30.f; int hold_duration = 50; int trigger_threshold = 12; bool use_during_initial_phase = true; } dominant_nearend_detection; struct SubbandNearendDetection { size_t nearend_average_blocks = 1; struct SubbandRegion { size_t low; size_t high; }; SubbandRegion subband1 = {1, 1}; SubbandRegion subband2 = {1, 1}; float nearend_threshold = 1.f; float snr_threshold = 1.f; } subband_nearend_detection; bool use_subband_nearend_detection = false; struct HighBandsSuppression { float enr_threshold = 1.f; float max_gain_during_echo = 1.f; float anti_howling_activation_threshold = 400.f; float anti_howling_gain = 1.f; } high_bands_suppression; float floor_first_increase = 0.00001f; } suppressor; }; } // namespace webrtc #endif // API_AUDIO_ECHO_CANCELLER3_CONFIG_H_