mirror of
https://github.com/mollyim/webrtc.git
synced 2025-05-12 21:30:45 +01:00

To quote rfc6464: The audio level for digital silence -- for a muted audio source, for example -- MUST be represented as 127 (-127 dBov), regardless of the dynamic range of the encoded audio format. The behavior in webrtc is correct that digital silence is represented with 127, but it is also possible to get a value of 127 for not quite digitally silent audio buffer (as in, not strictly 0s). Bug: webrtc:14029 Change-Id: I7ff8698a7e4d5c0960c667fd1cc961838e269456 Reviewed-on: https://webrtc-review.googlesource.com/c/src/+/261244 Commit-Queue: Tomas Gunnarsson <tommi@webrtc.org> Reviewed-by: Per Åhgren <peah@webrtc.org> Cr-Commit-Position: refs/heads/main@{#36793}
138 lines
4.1 KiB
C++
138 lines
4.1 KiB
C++
/*
|
|
* Copyright (c) 2014 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include "modules/audio_processing/rms_level.h"
|
|
|
|
#include <algorithm>
|
|
#include <cmath>
|
|
#include <numeric>
|
|
|
|
#include "rtc_base/checks.h"
|
|
|
|
namespace webrtc {
|
|
namespace {
|
|
static constexpr float kMaxSquaredLevel = 32768 * 32768;
|
|
// kMinLevel is the level corresponding to kMinLevelDb, that is 10^(-127/10).
|
|
static constexpr float kMinLevel = 1.995262314968883e-13f;
|
|
|
|
// Calculates the normalized RMS value from a mean square value. The input
|
|
// should be the sum of squared samples divided by the number of samples. The
|
|
// value will be normalized to full range before computing the RMS, wich is
|
|
// returned as a negated dBfs. That is, 0 is full amplitude while 127 is very
|
|
// faint.
|
|
int ComputeRms(float mean_square) {
|
|
if (mean_square <= kMinLevel * kMaxSquaredLevel) {
|
|
// Very faint; simply return the minimum value.
|
|
return RmsLevel::kMinLevelDb;
|
|
}
|
|
// Normalize by the max level.
|
|
const float mean_square_norm = mean_square / kMaxSquaredLevel;
|
|
RTC_DCHECK_GT(mean_square_norm, kMinLevel);
|
|
// 20log_10(x^0.5) = 10log_10(x)
|
|
const float rms = 10.f * std::log10(mean_square_norm);
|
|
RTC_DCHECK_LE(rms, 0.f);
|
|
RTC_DCHECK_GT(rms, -RmsLevel::kMinLevelDb);
|
|
// Return the negated value.
|
|
return static_cast<int>(-rms + 0.5f);
|
|
}
|
|
} // namespace
|
|
|
|
RmsLevel::RmsLevel() {
|
|
Reset();
|
|
}
|
|
|
|
RmsLevel::~RmsLevel() = default;
|
|
|
|
void RmsLevel::Reset() {
|
|
sum_square_ = 0.f;
|
|
sample_count_ = 0;
|
|
max_sum_square_ = 0.f;
|
|
block_size_ = absl::nullopt;
|
|
}
|
|
|
|
void RmsLevel::Analyze(rtc::ArrayView<const int16_t> data) {
|
|
if (data.empty()) {
|
|
return;
|
|
}
|
|
|
|
CheckBlockSize(data.size());
|
|
|
|
const float sum_square =
|
|
std::accumulate(data.begin(), data.end(), 0.f,
|
|
[](float a, int16_t b) { return a + b * b; });
|
|
RTC_DCHECK_GE(sum_square, 0.f);
|
|
sum_square_ += sum_square;
|
|
sample_count_ += data.size();
|
|
|
|
max_sum_square_ = std::max(max_sum_square_, sum_square);
|
|
}
|
|
|
|
void RmsLevel::Analyze(rtc::ArrayView<const float> data) {
|
|
if (data.empty()) {
|
|
return;
|
|
}
|
|
|
|
CheckBlockSize(data.size());
|
|
|
|
float sum_square = 0.f;
|
|
|
|
for (float data_k : data) {
|
|
int16_t tmp =
|
|
static_cast<int16_t>(std::min(std::max(data_k, -32768.f), 32767.f));
|
|
sum_square += tmp * tmp;
|
|
}
|
|
RTC_DCHECK_GE(sum_square, 0.f);
|
|
sum_square_ += sum_square;
|
|
sample_count_ += data.size();
|
|
|
|
max_sum_square_ = std::max(max_sum_square_, sum_square);
|
|
}
|
|
|
|
void RmsLevel::AnalyzeMuted(size_t length) {
|
|
CheckBlockSize(length);
|
|
sample_count_ += length;
|
|
}
|
|
|
|
int RmsLevel::Average() {
|
|
const bool have_samples = (sample_count_ != 0);
|
|
int rms = have_samples ? ComputeRms(sum_square_ / sample_count_)
|
|
: RmsLevel::kMinLevelDb;
|
|
|
|
// To ensure that kMinLevelDb represents digital silence (muted audio
|
|
// sources) we'll check here if the sum_square is actually 0. If it's not
|
|
// we'll bump up the return value to `kInaudibleButNotMuted`.
|
|
// https://datatracker.ietf.org/doc/html/rfc6464
|
|
if (have_samples && rms == RmsLevel::kMinLevelDb && sum_square_ != 0.0f) {
|
|
rms = kInaudibleButNotMuted;
|
|
}
|
|
|
|
Reset();
|
|
return rms;
|
|
}
|
|
|
|
RmsLevel::Levels RmsLevel::AverageAndPeak() {
|
|
// Note that block_size_ should by design always be non-empty when
|
|
// sample_count_ != 0. Also, the * operator of absl::optional enforces this
|
|
// with a DCHECK.
|
|
Levels levels = (sample_count_ == 0)
|
|
? Levels{RmsLevel::kMinLevelDb, RmsLevel::kMinLevelDb}
|
|
: Levels{ComputeRms(sum_square_ / sample_count_),
|
|
ComputeRms(max_sum_square_ / *block_size_)};
|
|
Reset();
|
|
return levels;
|
|
}
|
|
|
|
void RmsLevel::CheckBlockSize(size_t block_size) {
|
|
if (block_size_ != block_size) {
|
|
Reset();
|
|
block_size_ = block_size;
|
|
}
|
|
}
|
|
} // namespace webrtc
|