mirror of
https://github.com/mollyim/webrtc.git
synced 2025-05-13 13:50:40 +01:00

This reverts commit 81c0cf287c
.
Reason for revert: internal test failures
Original change's description:
> Simplification and refactoring of the AudioBuffer code
>
> This CL performs a major refactoring and simplification
> of the AudioBuffer code that.
> -Removes 7 of the 9 internal buffers of the AudioBuffer.
> -Avoids the implicit copying required to keep the
> internal buffers in sync.
> -Removes all code relating to handling of fixed-point
> sample data in the AudioBuffer.
> -Changes the naming of the class methods to reflect
> that only floating point is handled.
> -Corrects some bugs in the code.
> -Extends the handling of internal downmixing to be
> more generic.
>
> Bug: webrtc:10882
> Change-Id: I12c8af156fbe366b154744a0a1b3d926bf7be572
> Reviewed-on: https://webrtc-review.googlesource.com/c/src/+/149828
> Commit-Queue: Per Åhgren <peah@webrtc.org>
> Reviewed-by: Gustaf Ullberg <gustaf@webrtc.org>
> Cr-Commit-Position: refs/heads/master@{#28928}
TBR=gustaf@webrtc.org,peah@webrtc.org
Change-Id: I2729e3ad24b3a9b40b368b84cb565c859e79b51e
No-Presubmit: true
No-Tree-Checks: true
No-Try: true
Bug: webrtc:10882
Reviewed-on: https://webrtc-review.googlesource.com/c/src/+/150084
Reviewed-by: Steve Anton <steveanton@webrtc.org>
Commit-Queue: Steve Anton <steveanton@webrtc.org>
Cr-Commit-Position: refs/heads/master@{#28931}
123 lines
4.6 KiB
C++
123 lines
4.6 KiB
C++
/*
|
|
* Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
#include <vector>
|
|
|
|
#include "api/array_view.h"
|
|
#include "modules/audio_processing/audio_buffer.h"
|
|
#include "modules/audio_processing/test/audio_buffer_tools.h"
|
|
#include "modules/audio_processing/test/bitexactness_tools.h"
|
|
#include "modules/audio_processing/voice_detection_impl.h"
|
|
#include "test/gtest.h"
|
|
|
|
namespace webrtc {
|
|
namespace {
|
|
|
|
const int kNumFramesToProcess = 1000;
|
|
|
|
// Process one frame of data and produce the output.
|
|
void ProcessOneFrame(int sample_rate_hz,
|
|
AudioBuffer* audio_buffer,
|
|
VoiceDetectionImpl* voice_detection) {
|
|
if (sample_rate_hz > AudioProcessing::kSampleRate16kHz) {
|
|
audio_buffer->SplitIntoFrequencyBands();
|
|
}
|
|
|
|
voice_detection->ProcessCaptureAudio(audio_buffer);
|
|
}
|
|
|
|
// Processes a specified amount of frames, verifies the results and reports
|
|
// any errors.
|
|
void RunBitexactnessTest(int sample_rate_hz,
|
|
size_t num_channels,
|
|
int frame_size_ms_reference,
|
|
bool stream_has_voice_reference,
|
|
VoiceDetection::Likelihood likelihood_reference) {
|
|
rtc::CriticalSection crit_capture;
|
|
VoiceDetectionImpl voice_detection(&crit_capture);
|
|
voice_detection.Initialize(sample_rate_hz > 16000 ? 16000 : sample_rate_hz);
|
|
voice_detection.Enable(true);
|
|
|
|
int samples_per_channel = rtc::CheckedDivExact(sample_rate_hz, 100);
|
|
const StreamConfig capture_config(sample_rate_hz, num_channels, false);
|
|
AudioBuffer capture_buffer(
|
|
capture_config.num_frames(), capture_config.num_channels(),
|
|
capture_config.num_frames(), capture_config.num_channels(),
|
|
capture_config.num_frames());
|
|
test::InputAudioFile capture_file(
|
|
test::GetApmCaptureTestVectorFileName(sample_rate_hz));
|
|
std::vector<float> capture_input(samples_per_channel * num_channels);
|
|
for (int frame_no = 0; frame_no < kNumFramesToProcess; ++frame_no) {
|
|
ReadFloatSamplesFromStereoFile(samples_per_channel, num_channels,
|
|
&capture_file, capture_input);
|
|
|
|
test::CopyVectorToAudioBuffer(capture_config, capture_input,
|
|
&capture_buffer);
|
|
|
|
ProcessOneFrame(sample_rate_hz, &capture_buffer, &voice_detection);
|
|
}
|
|
|
|
int frame_size_ms = voice_detection.frame_size_ms();
|
|
bool stream_has_voice = voice_detection.stream_has_voice();
|
|
VoiceDetection::Likelihood likelihood = voice_detection.likelihood();
|
|
|
|
// Compare the outputs to the references.
|
|
EXPECT_EQ(frame_size_ms_reference, frame_size_ms);
|
|
EXPECT_EQ(stream_has_voice_reference, stream_has_voice);
|
|
EXPECT_EQ(likelihood_reference, likelihood);
|
|
}
|
|
|
|
const int kFrameSizeMsReference = 10;
|
|
const bool kStreamHasVoiceReference = true;
|
|
const VoiceDetection::Likelihood kLikelihoodReference =
|
|
VoiceDetection::kLowLikelihood;
|
|
|
|
} // namespace
|
|
|
|
TEST(VoiceDetectionBitExactnessTest, Mono8kHz) {
|
|
RunBitexactnessTest(8000, 1, kFrameSizeMsReference, kStreamHasVoiceReference,
|
|
kLikelihoodReference);
|
|
}
|
|
|
|
TEST(VoiceDetectionBitExactnessTest, Mono16kHz) {
|
|
RunBitexactnessTest(16000, 1, kFrameSizeMsReference, kStreamHasVoiceReference,
|
|
kLikelihoodReference);
|
|
}
|
|
|
|
TEST(VoiceDetectionBitExactnessTest, Mono32kHz) {
|
|
RunBitexactnessTest(32000, 1, kFrameSizeMsReference, kStreamHasVoiceReference,
|
|
kLikelihoodReference);
|
|
}
|
|
|
|
TEST(VoiceDetectionBitExactnessTest, Mono48kHz) {
|
|
RunBitexactnessTest(48000, 1, kFrameSizeMsReference, kStreamHasVoiceReference,
|
|
kLikelihoodReference);
|
|
}
|
|
|
|
TEST(VoiceDetectionBitExactnessTest, Stereo8kHz) {
|
|
RunBitexactnessTest(8000, 2, kFrameSizeMsReference, kStreamHasVoiceReference,
|
|
kLikelihoodReference);
|
|
}
|
|
|
|
TEST(VoiceDetectionBitExactnessTest, Stereo16kHz) {
|
|
RunBitexactnessTest(16000, 2, kFrameSizeMsReference, kStreamHasVoiceReference,
|
|
kLikelihoodReference);
|
|
}
|
|
|
|
TEST(VoiceDetectionBitExactnessTest, Stereo32kHz) {
|
|
RunBitexactnessTest(32000, 2, kFrameSizeMsReference, kStreamHasVoiceReference,
|
|
kLikelihoodReference);
|
|
}
|
|
|
|
TEST(VoiceDetectionBitExactnessTest, Stereo48kHz) {
|
|
RunBitexactnessTest(48000, 2, kFrameSizeMsReference, kStreamHasVoiceReference,
|
|
kLikelihoodReference);
|
|
}
|
|
|
|
} // namespace webrtc
|