/*
 *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
|
|
|
|
#ifndef API_AUDIO_ECHO_CANCELLER3_CONFIG_H_
|
|
#define API_AUDIO_ECHO_CANCELLER3_CONFIG_H_
|
|
|
|
#include <stddef.h> // size_t
|
|
|
|
#include "rtc_base/system/rtc_export.h"
|
|
|
|
namespace webrtc {
|
|
|
|
// Configuration struct for EchoCanceller3
|
|
struct RTC_EXPORT EchoCanceller3Config {
|
|
// Checks and updates the config parameters to lie within (mostly) reasonable
|
|
// ranges. Returns true if and only of the config did not need to be changed.
|
|
static bool Validate(EchoCanceller3Config* config);
|
|
|
|
EchoCanceller3Config();
|
|
EchoCanceller3Config(const EchoCanceller3Config& e);
|
|
EchoCanceller3Config& operator=(const EchoCanceller3Config& other);
|
|
|
|
struct Buffering {
|
|
size_t excess_render_detection_interval_blocks = 250;
|
|
size_t max_allowed_excess_render_blocks = 8;
|
|
} buffering;
|
|
|
|
struct Delay {
|
|
Delay();
|
|
Delay(const Delay& e);
|
|
Delay& operator=(const Delay& e);
|
|
size_t default_delay = 5;
|
|
size_t down_sampling_factor = 4;
|
|
size_t num_filters = 5;
|
|
size_t delay_headroom_samples = 32;
|
|
size_t hysteresis_limit_blocks = 1;
|
|
size_t fixed_capture_delay_samples = 0;
|
|
float delay_estimate_smoothing = 0.7f;
|
|
float delay_candidate_detection_threshold = 0.2f;
|
|
struct DelaySelectionThresholds {
|
|
int initial;
|
|
int converged;
|
|
} delay_selection_thresholds = {5, 20};
|
|
bool use_external_delay_estimator = false;
|
|
bool log_warning_on_delay_changes = false;
|
|
struct AlignmentMixing {
|
|
bool downmix;
|
|
bool adaptive_selection;
|
|
float activity_power_threshold;
|
|
bool prefer_first_two_channels;
|
|
};
|
|
AlignmentMixing render_alignment_mixing = {false, true, 10000.f, true};
|
|
AlignmentMixing capture_alignment_mixing = {false, true, 10000.f, false};
|
|
} delay;
|
|
|
|
struct Filter {
|
|
struct RefinedConfiguration {
|
|
size_t length_blocks;
|
|
float leakage_converged;
|
|
float leakage_diverged;
|
|
float error_floor;
|
|
float error_ceil;
|
|
float noise_gate;
|
|
};
|
|
|
|
struct CoarseConfiguration {
|
|
size_t length_blocks;
|
|
float rate;
|
|
float noise_gate;
|
|
};
|
|
|
|
RefinedConfiguration refined = {13, 0.00005f, 0.05f,
|
|
0.001f, 2.f, 20075344.f};
|
|
CoarseConfiguration coarse = {13, 0.7f, 20075344.f};
|
|
|
|
RefinedConfiguration refined_initial = {12, 0.005f, 0.5f,
|
|
0.001f, 2.f, 20075344.f};
|
|
CoarseConfiguration coarse_initial = {12, 0.9f, 20075344.f};
|
|
|
|
size_t config_change_duration_blocks = 250;
|
|
float initial_state_seconds = 2.5f;
|
|
bool conservative_initial_phase = false;
|
|
bool enable_coarse_filter_output_usage = true;
|
|
bool use_linear_filter = true;
|
|
bool export_linear_aec_output = false;
|
|
} filter;
|
|
|
|
struct Erle {
|
|
float min = 1.f;
|
|
float max_l = 4.f;
|
|
float max_h = 1.5f;
|
|
bool onset_detection = true;
|
|
size_t num_sections = 1;
|
|
bool clamp_quality_estimate_to_zero = true;
|
|
bool clamp_quality_estimate_to_one = true;
|
|
} erle;
|
|
|
|
struct EpStrength {
|
|
float default_gain = 1.f;
|
|
float default_len = 0.83f;
|
|
bool echo_can_saturate = true;
|
|
bool bounded_erl = false;
|
|
} ep_strength;
|
|
|
|
struct EchoAudibility {
|
|
float low_render_limit = 4 * 64.f;
|
|
float normal_render_limit = 64.f;
|
|
float floor_power = 2 * 64.f;
|
|
float audibility_threshold_lf = 10;
|
|
float audibility_threshold_mf = 10;
|
|
float audibility_threshold_hf = 10;
|
|
bool use_stationarity_properties = false;
|
|
bool use_stationarity_properties_at_init = false;
|
|
} echo_audibility;
|
|
|
|
struct RenderLevels {
|
|
float active_render_limit = 100.f;
|
|
float poor_excitation_render_limit = 150.f;
|
|
float poor_excitation_render_limit_ds8 = 20.f;
|
|
float render_power_gain_db = 0.f;
|
|
} render_levels;
|
|
|
|
struct EchoRemovalControl {
|
|
bool has_clock_drift = false;
|
|
bool linear_and_stable_echo_path = false;
|
|
} echo_removal_control;
|
|
|
|
struct EchoModel {
|
|
EchoModel();
|
|
EchoModel(const EchoModel& e);
|
|
EchoModel& operator=(const EchoModel& e);
|
|
size_t noise_floor_hold = 50;
|
|
float min_noise_floor_power = 1638400.f;
|
|
float stationary_gate_slope = 10.f;
|
|
float noise_gate_power = 27509.42f;
|
|
float noise_gate_slope = 0.3f;
|
|
size_t render_pre_window_size = 1;
|
|
size_t render_post_window_size = 1;
|
|
} echo_model;
|
|
|
|
struct ComfortNoise {
|
|
float noise_floor_dbfs = -96.03406f;
|
|
} comfort_noise;
|
|
|
|
struct Suppressor {
|
|
Suppressor();
|
|
Suppressor(const Suppressor& e);
|
|
Suppressor& operator=(const Suppressor& e);
|
|
|
|
size_t nearend_average_blocks = 4;
|
|
|
|
struct MaskingThresholds {
|
|
MaskingThresholds(float enr_transparent,
|
|
float enr_suppress,
|
|
float emr_transparent);
|
|
MaskingThresholds(const MaskingThresholds& e);
|
|
MaskingThresholds& operator=(const MaskingThresholds& e);
|
|
float enr_transparent;
|
|
float enr_suppress;
|
|
float emr_transparent;
|
|
};
|
|
|
|
struct Tuning {
|
|
Tuning(MaskingThresholds mask_lf,
|
|
MaskingThresholds mask_hf,
|
|
float max_inc_factor,
|
|
float max_dec_factor_lf);
|
|
Tuning(const Tuning& e);
|
|
Tuning& operator=(const Tuning& e);
|
|
MaskingThresholds mask_lf;
|
|
MaskingThresholds mask_hf;
|
|
float max_inc_factor;
|
|
float max_dec_factor_lf;
|
|
};
|
|
|
|
Tuning normal_tuning = Tuning(MaskingThresholds(.3f, .4f, .3f),
|
|
MaskingThresholds(.07f, .1f, .3f),
|
|
2.0f,
|
|
0.25f);
|
|
Tuning nearend_tuning = Tuning(MaskingThresholds(1.09f, 1.1f, .3f),
|
|
MaskingThresholds(.1f, .3f, .3f),
|
|
2.0f,
|
|
0.25f);
|
|
|
|
struct DominantNearendDetection {
|
|
float enr_threshold = .25f;
|
|
float enr_exit_threshold = 10.f;
|
|
float snr_threshold = 30.f;
|
|
int hold_duration = 50;
|
|
int trigger_threshold = 12;
|
|
bool use_during_initial_phase = true;
|
|
} dominant_nearend_detection;
|
|
|
|
struct SubbandNearendDetection {
|
|
size_t nearend_average_blocks = 1;
|
|
struct SubbandRegion {
|
|
size_t low;
|
|
size_t high;
|
|
};
|
|
SubbandRegion subband1 = {1, 1};
|
|
SubbandRegion subband2 = {1, 1};
|
|
float nearend_threshold = 1.f;
|
|
float snr_threshold = 1.f;
|
|
} subband_nearend_detection;
|
|
|
|
bool use_subband_nearend_detection = false;
|
|
|
|
struct HighBandsSuppression {
|
|
float enr_threshold = 1.f;
|
|
float max_gain_during_echo = 1.f;
|
|
float anti_howling_activation_threshold = 25.f;
|
|
float anti_howling_gain = 0.01f;
|
|
} high_bands_suppression;
|
|
|
|
float floor_first_increase = 0.00001f;
|
|
} suppressor;
|
|
};
|
|
} // namespace webrtc
|
|
|
|
#endif // API_AUDIO_ECHO_CANCELLER3_CONFIG_H_
|