mirror of
https://github.com/mollyim/webrtc.git
synced 2025-05-13 05:40:42 +01:00

This reverts commit b4e06d032e
.
Reason for revert: breaking downstream projects
Original change's description:
> Remove unused APM voice activity detection sub-module
>
> API changes:
> - webrtc::AudioProcessing::Config::VoiceDetection removed
> - webrtc::AudioProcessingStats::voice_detected deprecated
> - cricket::AudioOptions::typing_detection deprecated
> - webrtc::StatsReport::StatsValueName::
> kStatsValueNameTypingNoiseState deprecated
>
> PSA: https://groups.google.com/g/discuss-webrtc/c/7X6uwmJarE0
>
> Bug: webrtc:11226,webrtc:11292
> Change-Id: I8d008b56708cf62961b9857ec052b59fda3b41bf
> Reviewed-on: https://webrtc-review.googlesource.com/c/src/+/250666
> Reviewed-by: Harald Alvestrand <hta@webrtc.org>
> Reviewed-by: Gustaf Ullberg <gustaf@webrtc.org>
> Reviewed-by: Sam Zackrisson <saza@webrtc.org>
> Reviewed-by: Björn Terelius <terelius@webrtc.org>
> Commit-Queue: Alessio Bazzica <alessiob@webrtc.org>
> Cr-Commit-Position: refs/heads/main@{#35975}
TBR=gustaf@webrtc.org,saza@webrtc.org,alessiob@webrtc.org,terelius@webrtc.org,hta@webrtc.org,webrtc-scoped@luci-project-accounts.iam.gserviceaccount.com
Change-Id: Iee01fdb874b4e0331277f3ffe60dacaabc3859a2
No-Presubmit: true
No-Tree-Checks: true
No-Try: true
Bug: webrtc:11226,webrtc:11292
Reviewed-on: https://webrtc-review.googlesource.com/c/src/+/251600
Reviewed-by: Harald Alvestrand <hta@webrtc.org>
Reviewed-by: Gustaf Ullberg <gustaf@webrtc.org>
Commit-Queue: Mirko Bonadei <mbonadei@webrtc.org>
Cr-Commit-Position: refs/heads/main@{#35977}
59 lines
1.7 KiB
C++
59 lines
1.7 KiB
C++
/*
|
|
* Copyright (c) 2019 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#ifndef MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_
|
|
#define MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_
|
|
|
|
#include <stddef.h>
|
|
|
|
#include <memory>
|
|
|
|
#include "modules/audio_processing/include/audio_processing.h"
|
|
|
|
namespace webrtc {
|
|
|
|
class AudioBuffer;
|
|
|
|
// The voice activity detection (VAD) component analyzes the stream to
|
|
// determine if voice is present.
|
|
class VoiceDetection {
|
|
public:
|
|
// Specifies the likelihood that a frame will be declared to contain voice.
|
|
// A higher value makes it more likely that speech will not be clipped, at
|
|
// the expense of more noise being detected as voice.
|
|
enum Likelihood {
|
|
kVeryLowLikelihood,
|
|
kLowLikelihood,
|
|
kModerateLikelihood,
|
|
kHighLikelihood
|
|
};
|
|
|
|
VoiceDetection(int sample_rate_hz, Likelihood likelihood);
|
|
~VoiceDetection();
|
|
|
|
VoiceDetection(VoiceDetection&) = delete;
|
|
VoiceDetection& operator=(VoiceDetection&) = delete;
|
|
|
|
// Returns true if voice is detected in the current frame.
|
|
bool ProcessCaptureAudio(AudioBuffer* audio);
|
|
|
|
Likelihood likelihood() const { return likelihood_; }
|
|
|
|
private:
|
|
class Vad;
|
|
|
|
int sample_rate_hz_;
|
|
size_t frame_size_samples_;
|
|
Likelihood likelihood_;
|
|
std::unique_ptr<Vad> vad_;
|
|
};
|
|
} // namespace webrtc
|
|
|
|
#endif // MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_
|