mirror of
https://github.com/mollyim/webrtc.git
synced 2025-05-13 05:40:42 +01:00
Disable high-pass filtering of the AEC reference
Currently the echo canceller reference signal is high-pass filtered to avoid the need of modeling the capture-side high-pass filter as part of the echo path. This can lead to the lowest frequency bins of the linear filter diverging as there is little low-frequency content available for training. Over time the filter can output an increasing amount of low-frequency power, which in turn affects the filter's ability to adapt properly. Disabling the high-pass filtering of the echo canceller reference solves this issue, resulting in improved filter convergence. Bug: webrtc:12265 Change-Id: Ic526a4b1b73e1808cfcd96a8cdee801b96a27671 Reviewed-on: https://webrtc-review.googlesource.com/c/src/+/208288 Reviewed-by: Per Åhgren <peah@webrtc.org> Commit-Queue: Gustaf Ullberg <gustaf@webrtc.org> Cr-Commit-Position: refs/heads/master@{#33322}
This commit is contained in:
parent
e5caa9e2d3
commit
09226fc832
8 changed files with 28 additions and 12 deletions
|
@ -90,6 +90,7 @@ struct RTC_EXPORT EchoCanceller3Config {
|
||||||
bool conservative_initial_phase = false;
|
bool conservative_initial_phase = false;
|
||||||
bool enable_coarse_filter_output_usage = true;
|
bool enable_coarse_filter_output_usage = true;
|
||||||
bool use_linear_filter = true;
|
bool use_linear_filter = true;
|
||||||
|
bool high_pass_filter_echo_reference = false;
|
||||||
bool export_linear_aec_output = false;
|
bool export_linear_aec_output = false;
|
||||||
} filter;
|
} filter;
|
||||||
|
|
||||||
|
|
|
@ -230,6 +230,8 @@ void Aec3ConfigFromJsonString(absl::string_view json_string,
|
||||||
ReadParam(section, "enable_coarse_filter_output_usage",
|
ReadParam(section, "enable_coarse_filter_output_usage",
|
||||||
&cfg.filter.enable_coarse_filter_output_usage);
|
&cfg.filter.enable_coarse_filter_output_usage);
|
||||||
ReadParam(section, "use_linear_filter", &cfg.filter.use_linear_filter);
|
ReadParam(section, "use_linear_filter", &cfg.filter.use_linear_filter);
|
||||||
|
ReadParam(section, "high_pass_filter_echo_reference",
|
||||||
|
&cfg.filter.high_pass_filter_echo_reference);
|
||||||
ReadParam(section, "export_linear_aec_output",
|
ReadParam(section, "export_linear_aec_output",
|
||||||
&cfg.filter.export_linear_aec_output);
|
&cfg.filter.export_linear_aec_output);
|
||||||
}
|
}
|
||||||
|
@ -513,6 +515,9 @@ std::string Aec3ConfigToJsonString(const EchoCanceller3Config& config) {
|
||||||
<< ",";
|
<< ",";
|
||||||
ost << "\"use_linear_filter\": "
|
ost << "\"use_linear_filter\": "
|
||||||
<< (config.filter.use_linear_filter ? "true" : "false") << ",";
|
<< (config.filter.use_linear_filter ? "true" : "false") << ",";
|
||||||
|
ost << "\"high_pass_filter_echo_reference\": "
|
||||||
|
<< (config.filter.high_pass_filter_echo_reference ? "true" : "false")
|
||||||
|
<< ",";
|
||||||
ost << "\"export_linear_aec_output\": "
|
ost << "\"export_linear_aec_output\": "
|
||||||
<< (config.filter.export_linear_aec_output ? "true" : "false");
|
<< (config.filter.export_linear_aec_output ? "true" : "false");
|
||||||
|
|
||||||
|
|
|
@ -21,6 +21,8 @@ TEST(EchoCanceller3JsonHelpers, ToStringAndParseJson) {
|
||||||
cfg.delay.log_warning_on_delay_changes = true;
|
cfg.delay.log_warning_on_delay_changes = true;
|
||||||
cfg.filter.refined.error_floor = 2.f;
|
cfg.filter.refined.error_floor = 2.f;
|
||||||
cfg.filter.coarse_initial.length_blocks = 3u;
|
cfg.filter.coarse_initial.length_blocks = 3u;
|
||||||
|
cfg.filter.high_pass_filter_echo_reference =
|
||||||
|
!cfg.filter.high_pass_filter_echo_reference;
|
||||||
cfg.comfort_noise.noise_floor_dbfs = 100.f;
|
cfg.comfort_noise.noise_floor_dbfs = 100.f;
|
||||||
cfg.echo_model.model_reverb_in_nonlinear_mode = false;
|
cfg.echo_model.model_reverb_in_nonlinear_mode = false;
|
||||||
cfg.suppressor.normal_tuning.mask_hf.enr_suppress = .5f;
|
cfg.suppressor.normal_tuning.mask_hf.enr_suppress = .5f;
|
||||||
|
@ -47,6 +49,8 @@ TEST(EchoCanceller3JsonHelpers, ToStringAndParseJson) {
|
||||||
cfg_transformed.filter.coarse_initial.length_blocks);
|
cfg_transformed.filter.coarse_initial.length_blocks);
|
||||||
EXPECT_EQ(cfg.filter.refined.error_floor,
|
EXPECT_EQ(cfg.filter.refined.error_floor,
|
||||||
cfg_transformed.filter.refined.error_floor);
|
cfg_transformed.filter.refined.error_floor);
|
||||||
|
EXPECT_EQ(cfg.filter.high_pass_filter_echo_reference,
|
||||||
|
cfg_transformed.filter.high_pass_filter_echo_reference);
|
||||||
EXPECT_EQ(cfg.comfort_noise.noise_floor_dbfs,
|
EXPECT_EQ(cfg.comfort_noise.noise_floor_dbfs,
|
||||||
cfg_transformed.comfort_noise.noise_floor_dbfs);
|
cfg_transformed.comfort_noise.noise_floor_dbfs);
|
||||||
EXPECT_EQ(cfg.echo_model.model_reverb_in_nonlinear_mode,
|
EXPECT_EQ(cfg.echo_model.model_reverb_in_nonlinear_mode,
|
||||||
|
|
|
@ -251,6 +251,10 @@ EchoCanceller3Config AdjustConfig(const EchoCanceller3Config& config) {
|
||||||
adjusted_cfg.filter.initial_state_seconds = 2.0f;
|
adjusted_cfg.filter.initial_state_seconds = 2.0f;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (field_trial::IsEnabled("WebRTC-Aec3HighPassFilterEchoReference")) {
|
||||||
|
adjusted_cfg.filter.high_pass_filter_echo_reference = true;
|
||||||
|
}
|
||||||
|
|
||||||
if (field_trial::IsEnabled("WebRTC-Aec3EchoSaturationDetectionKillSwitch")) {
|
if (field_trial::IsEnabled("WebRTC-Aec3EchoSaturationDetectionKillSwitch")) {
|
||||||
adjusted_cfg.ep_strength.echo_can_saturate = false;
|
adjusted_cfg.ep_strength.echo_can_saturate = false;
|
||||||
}
|
}
|
||||||
|
@ -574,6 +578,7 @@ EchoCanceller3Config AdjustConfig(const EchoCanceller3Config& config) {
|
||||||
class EchoCanceller3::RenderWriter {
|
class EchoCanceller3::RenderWriter {
|
||||||
public:
|
public:
|
||||||
RenderWriter(ApmDataDumper* data_dumper,
|
RenderWriter(ApmDataDumper* data_dumper,
|
||||||
|
const EchoCanceller3Config& config,
|
||||||
SwapQueue<std::vector<std::vector<std::vector<float>>>,
|
SwapQueue<std::vector<std::vector<std::vector<float>>>,
|
||||||
Aec3RenderQueueItemVerifier>* render_transfer_queue,
|
Aec3RenderQueueItemVerifier>* render_transfer_queue,
|
||||||
size_t num_bands,
|
size_t num_bands,
|
||||||
|
@ -590,7 +595,7 @@ class EchoCanceller3::RenderWriter {
|
||||||
ApmDataDumper* data_dumper_;
|
ApmDataDumper* data_dumper_;
|
||||||
const size_t num_bands_;
|
const size_t num_bands_;
|
||||||
const size_t num_channels_;
|
const size_t num_channels_;
|
||||||
HighPassFilter high_pass_filter_;
|
std::unique_ptr<HighPassFilter> high_pass_filter_;
|
||||||
std::vector<std::vector<std::vector<float>>> render_queue_input_frame_;
|
std::vector<std::vector<std::vector<float>>> render_queue_input_frame_;
|
||||||
SwapQueue<std::vector<std::vector<std::vector<float>>>,
|
SwapQueue<std::vector<std::vector<std::vector<float>>>,
|
||||||
Aec3RenderQueueItemVerifier>* render_transfer_queue_;
|
Aec3RenderQueueItemVerifier>* render_transfer_queue_;
|
||||||
|
@ -598,6 +603,7 @@ class EchoCanceller3::RenderWriter {
|
||||||
|
|
||||||
EchoCanceller3::RenderWriter::RenderWriter(
|
EchoCanceller3::RenderWriter::RenderWriter(
|
||||||
ApmDataDumper* data_dumper,
|
ApmDataDumper* data_dumper,
|
||||||
|
const EchoCanceller3Config& config,
|
||||||
SwapQueue<std::vector<std::vector<std::vector<float>>>,
|
SwapQueue<std::vector<std::vector<std::vector<float>>>,
|
||||||
Aec3RenderQueueItemVerifier>* render_transfer_queue,
|
Aec3RenderQueueItemVerifier>* render_transfer_queue,
|
||||||
size_t num_bands,
|
size_t num_bands,
|
||||||
|
@ -605,7 +611,6 @@ EchoCanceller3::RenderWriter::RenderWriter(
|
||||||
: data_dumper_(data_dumper),
|
: data_dumper_(data_dumper),
|
||||||
num_bands_(num_bands),
|
num_bands_(num_bands),
|
||||||
num_channels_(num_channels),
|
num_channels_(num_channels),
|
||||||
high_pass_filter_(16000, num_channels),
|
|
||||||
render_queue_input_frame_(
|
render_queue_input_frame_(
|
||||||
num_bands_,
|
num_bands_,
|
||||||
std::vector<std::vector<float>>(
|
std::vector<std::vector<float>>(
|
||||||
|
@ -613,6 +618,9 @@ EchoCanceller3::RenderWriter::RenderWriter(
|
||||||
std::vector<float>(AudioBuffer::kSplitBandSize, 0.f))),
|
std::vector<float>(AudioBuffer::kSplitBandSize, 0.f))),
|
||||||
render_transfer_queue_(render_transfer_queue) {
|
render_transfer_queue_(render_transfer_queue) {
|
||||||
RTC_DCHECK(data_dumper);
|
RTC_DCHECK(data_dumper);
|
||||||
|
if (config.filter.high_pass_filter_echo_reference) {
|
||||||
|
high_pass_filter_ = std::make_unique<HighPassFilter>(16000, num_channels);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
EchoCanceller3::RenderWriter::~RenderWriter() = default;
|
EchoCanceller3::RenderWriter::~RenderWriter() = default;
|
||||||
|
@ -631,7 +639,9 @@ void EchoCanceller3::RenderWriter::Insert(const AudioBuffer& input) {
|
||||||
|
|
||||||
CopyBufferIntoFrame(input, num_bands_, num_channels_,
|
CopyBufferIntoFrame(input, num_bands_, num_channels_,
|
||||||
&render_queue_input_frame_);
|
&render_queue_input_frame_);
|
||||||
high_pass_filter_.Process(&render_queue_input_frame_[0]);
|
if (high_pass_filter_) {
|
||||||
|
high_pass_filter_->Process(&render_queue_input_frame_[0]);
|
||||||
|
}
|
||||||
|
|
||||||
static_cast<void>(render_transfer_queue_->Insert(&render_queue_input_frame_));
|
static_cast<void>(render_transfer_queue_->Insert(&render_queue_input_frame_));
|
||||||
}
|
}
|
||||||
|
@ -704,7 +714,7 @@ EchoCanceller3::EchoCanceller3(const EchoCanceller3Config& config,
|
||||||
config_.delay.fixed_capture_delay_samples));
|
config_.delay.fixed_capture_delay_samples));
|
||||||
}
|
}
|
||||||
|
|
||||||
render_writer_.reset(new RenderWriter(data_dumper_.get(),
|
render_writer_.reset(new RenderWriter(data_dumper_.get(), config_,
|
||||||
&render_transfer_queue_, num_bands_,
|
&render_transfer_queue_, num_bands_,
|
||||||
num_render_channels_));
|
num_render_channels_));
|
||||||
|
|
||||||
|
|
|
@ -252,8 +252,6 @@ class EchoCanceller3Tester {
|
||||||
capture_output.push_back(capture_buffer_.split_bands(0)[0][k]);
|
capture_output.push_back(capture_buffer_.split_bands(0)[0][k]);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
HighPassFilter hp_filter(16000, 1);
|
|
||||||
hp_filter.Process(&render_input);
|
|
||||||
|
|
||||||
EXPECT_TRUE(
|
EXPECT_TRUE(
|
||||||
VerifyOutputFrameBitexactness(render_input[0], capture_output, -64));
|
VerifyOutputFrameBitexactness(render_input[0], capture_output, -64));
|
||||||
|
@ -545,8 +543,6 @@ class EchoCanceller3Tester {
|
||||||
capture_output.push_back(capture_buffer_.split_bands(0)[0][k]);
|
capture_output.push_back(capture_buffer_.split_bands(0)[0][k]);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
HighPassFilter hp_filter(16000, 1);
|
|
||||||
hp_filter.Process(&render_input);
|
|
||||||
|
|
||||||
EXPECT_TRUE(
|
EXPECT_TRUE(
|
||||||
VerifyOutputFrameBitexactness(render_input[0], capture_output, -64));
|
VerifyOutputFrameBitexactness(render_input[0], capture_output, -64));
|
||||||
|
|
|
@ -2216,7 +2216,7 @@ INSTANTIATE_TEST_SUITE_P(
|
||||||
std::make_tuple(32000, 44100, 16000, 44100, 19, 15),
|
std::make_tuple(32000, 44100, 16000, 44100, 19, 15),
|
||||||
std::make_tuple(32000, 32000, 48000, 32000, 40, 35),
|
std::make_tuple(32000, 32000, 48000, 32000, 40, 35),
|
||||||
std::make_tuple(32000, 32000, 32000, 32000, 0, 0),
|
std::make_tuple(32000, 32000, 32000, 32000, 0, 0),
|
||||||
std::make_tuple(32000, 32000, 16000, 32000, 40, 20),
|
std::make_tuple(32000, 32000, 16000, 32000, 39, 20),
|
||||||
std::make_tuple(32000, 16000, 48000, 16000, 25, 20),
|
std::make_tuple(32000, 16000, 48000, 16000, 25, 20),
|
||||||
std::make_tuple(32000, 16000, 32000, 16000, 25, 20),
|
std::make_tuple(32000, 16000, 32000, 16000, 25, 20),
|
||||||
std::make_tuple(32000, 16000, 16000, 16000, 25, 0),
|
std::make_tuple(32000, 16000, 16000, 16000, 25, 0),
|
||||||
|
@ -2231,7 +2231,7 @@ INSTANTIATE_TEST_SUITE_P(
|
||||||
std::make_tuple(16000, 32000, 32000, 32000, 25, 0),
|
std::make_tuple(16000, 32000, 32000, 32000, 25, 0),
|
||||||
std::make_tuple(16000, 32000, 16000, 32000, 25, 20),
|
std::make_tuple(16000, 32000, 16000, 32000, 25, 20),
|
||||||
std::make_tuple(16000, 16000, 48000, 16000, 39, 20),
|
std::make_tuple(16000, 16000, 48000, 16000, 39, 20),
|
||||||
std::make_tuple(16000, 16000, 32000, 16000, 40, 20),
|
std::make_tuple(16000, 16000, 32000, 16000, 39, 20),
|
||||||
std::make_tuple(16000, 16000, 16000, 16000, 0, 0)));
|
std::make_tuple(16000, 16000, 16000, 16000, 0, 0)));
|
||||||
|
|
||||||
#elif defined(WEBRTC_AUDIOPROC_FIXED_PROFILE)
|
#elif defined(WEBRTC_AUDIOPROC_FIXED_PROFILE)
|
||||||
|
|
|
@ -1 +1 @@
|
||||||
1dd2c11da1f1dec49f728881628c1348e07a19cd
|
749efdfd1e3c3ace434b3673dac9ce4938534449
|
|
@ -1 +1 @@
|
||||||
16e9d8f3b8b6c23b2b5100a1162acfe67acc37a7
|
78c1a84de332173863c997538aa19b8cdcba5020
|
Loading…
Reference in a new issue