/* * Copyright (c) 2016 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include #include "api/array_view.h" #include "modules/audio_processing/audio_buffer.h" #include "modules/audio_processing/test/audio_buffer_tools.h" #include "modules/audio_processing/test/bitexactness_tools.h" #include "modules/audio_processing/voice_detection_impl.h" #include "test/gtest.h" namespace webrtc { namespace { const int kNumFramesToProcess = 1000; // Process one frame of data and produce the output. void ProcessOneFrame(int sample_rate_hz, AudioBuffer* audio_buffer, VoiceDetectionImpl* voice_detection) { if (sample_rate_hz > AudioProcessing::kSampleRate16kHz) { audio_buffer->SplitIntoFrequencyBands(); } voice_detection->ProcessCaptureAudio(audio_buffer); } // Processes a specified amount of frames, verifies the results and reports // any errors. void RunBitexactnessTest(int sample_rate_hz, size_t num_channels, int frame_size_ms_reference, bool stream_has_voice_reference, VoiceDetection::Likelihood likelihood_reference) { rtc::CriticalSection crit_capture; VoiceDetectionImpl voice_detection(&crit_capture); voice_detection.Initialize(sample_rate_hz > 16000 ? 16000 : sample_rate_hz); voice_detection.Enable(true); int samples_per_channel = rtc::CheckedDivExact(sample_rate_hz, 100); const StreamConfig capture_config(sample_rate_hz, num_channels, false); AudioBuffer capture_buffer( capture_config.num_frames(), capture_config.num_channels(), capture_config.num_frames(), capture_config.num_channels(), capture_config.num_frames()); test::InputAudioFile capture_file( test::GetApmCaptureTestVectorFileName(sample_rate_hz)); std::vector capture_input(samples_per_channel * num_channels); for (int frame_no = 0; frame_no < kNumFramesToProcess; ++frame_no) { ReadFloatSamplesFromStereoFile(samples_per_channel, num_channels, &capture_file, capture_input); test::CopyVectorToAudioBuffer(capture_config, capture_input, &capture_buffer); ProcessOneFrame(sample_rate_hz, &capture_buffer, &voice_detection); } int frame_size_ms = voice_detection.frame_size_ms(); bool stream_has_voice = voice_detection.stream_has_voice(); VoiceDetection::Likelihood likelihood = voice_detection.likelihood(); // Compare the outputs to the references. EXPECT_EQ(frame_size_ms_reference, frame_size_ms); EXPECT_EQ(stream_has_voice_reference, stream_has_voice); EXPECT_EQ(likelihood_reference, likelihood); } const int kFrameSizeMsReference = 10; const bool kStreamHasVoiceReference = true; const VoiceDetection::Likelihood kLikelihoodReference = VoiceDetection::kLowLikelihood; } // namespace TEST(VoiceDetectionBitExactnessTest, Mono8kHz) { RunBitexactnessTest(8000, 1, kFrameSizeMsReference, kStreamHasVoiceReference, kLikelihoodReference); } TEST(VoiceDetectionBitExactnessTest, Mono16kHz) { RunBitexactnessTest(16000, 1, kFrameSizeMsReference, kStreamHasVoiceReference, kLikelihoodReference); } TEST(VoiceDetectionBitExactnessTest, Mono32kHz) { RunBitexactnessTest(32000, 1, kFrameSizeMsReference, kStreamHasVoiceReference, kLikelihoodReference); } TEST(VoiceDetectionBitExactnessTest, Mono48kHz) { RunBitexactnessTest(48000, 1, kFrameSizeMsReference, kStreamHasVoiceReference, kLikelihoodReference); } TEST(VoiceDetectionBitExactnessTest, Stereo8kHz) { RunBitexactnessTest(8000, 2, kFrameSizeMsReference, kStreamHasVoiceReference, kLikelihoodReference); } TEST(VoiceDetectionBitExactnessTest, Stereo16kHz) { RunBitexactnessTest(16000, 2, kFrameSizeMsReference, kStreamHasVoiceReference, kLikelihoodReference); } TEST(VoiceDetectionBitExactnessTest, Stereo32kHz) { RunBitexactnessTest(32000, 2, kFrameSizeMsReference, kStreamHasVoiceReference, kLikelihoodReference); } TEST(VoiceDetectionBitExactnessTest, Stereo48kHz) { RunBitexactnessTest(48000, 2, kFrameSizeMsReference, kStreamHasVoiceReference, kLikelihoodReference); } } // namespace webrtc