mirror of
https://github.com/mollyim/webrtc.git
synced 2025-05-13 05:40:42 +01:00

Bug: webrtc:342905193 No-Try: True Change-Id: Icc968be43b8830038ea9a1f5f604307220457807 Reviewed-on: https://webrtc-review.googlesource.com/c/src/+/361021 Auto-Submit: Florent Castelli <orphis@webrtc.org> Reviewed-by: Harald Alvestrand <hta@webrtc.org> Commit-Queue: Florent Castelli <orphis@webrtc.org> Cr-Commit-Position: refs/heads/main@{#42911}
432 lines
16 KiB
C++
432 lines
16 KiB
C++
/*
|
|
* Copyright (c) 2022 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include "video/video_stream_buffer_controller.h"
|
|
|
|
#include <algorithm>
|
|
#include <memory>
|
|
#include <optional>
|
|
#include <utility>
|
|
|
|
#include "absl/base/attributes.h"
|
|
#include "absl/functional/bind_front.h"
|
|
#include "api/sequence_checker.h"
|
|
#include "api/task_queue/task_queue_base.h"
|
|
#include "api/units/data_size.h"
|
|
#include "api/units/time_delta.h"
|
|
#include "api/units/timestamp.h"
|
|
#include "api/video/encoded_frame.h"
|
|
#include "api/video/frame_buffer.h"
|
|
#include "api/video/video_content_type.h"
|
|
#include "modules/video_coding/frame_helpers.h"
|
|
#include "modules/video_coding/timing/inter_frame_delay_variation_calculator.h"
|
|
#include "modules/video_coding/timing/jitter_estimator.h"
|
|
#include "rtc_base/checks.h"
|
|
#include "rtc_base/logging.h"
|
|
#include "rtc_base/thread_annotations.h"
|
|
#include "video/frame_decode_scheduler.h"
|
|
#include "video/frame_decode_timing.h"
|
|
#include "video/task_queue_frame_decode_scheduler.h"
|
|
#include "video/video_receive_stream_timeout_tracker.h"
|
|
|
|
namespace webrtc {
|
|
|
|
namespace {
|
|
|
|
// Max number of frames the buffer will hold.
|
|
static constexpr size_t kMaxFramesBuffered = 800;
|
|
// Max number of decoded frame info that will be saved.
|
|
static constexpr int kMaxFramesHistory = 1 << 13;
|
|
|
|
// Default value for the maximum decode queue size that is used when the
|
|
// low-latency renderer is used.
|
|
static constexpr size_t kZeroPlayoutDelayDefaultMaxDecodeQueueSize = 8;
|
|
|
|
struct FrameMetadata {
|
|
explicit FrameMetadata(const EncodedFrame& frame)
|
|
: is_last_spatial_layer(frame.is_last_spatial_layer),
|
|
is_keyframe(frame.is_keyframe()),
|
|
size(frame.size()),
|
|
contentType(frame.contentType()),
|
|
delayed_by_retransmission(frame.delayed_by_retransmission()),
|
|
rtp_timestamp(frame.RtpTimestamp()),
|
|
receive_time(frame.ReceivedTimestamp()) {}
|
|
|
|
const bool is_last_spatial_layer;
|
|
const bool is_keyframe;
|
|
const size_t size;
|
|
const VideoContentType contentType;
|
|
const bool delayed_by_retransmission;
|
|
const uint32_t rtp_timestamp;
|
|
const std::optional<Timestamp> receive_time;
|
|
};
|
|
|
|
Timestamp MinReceiveTime(const EncodedFrame& frame) {
|
|
Timestamp first_recv_time = Timestamp::PlusInfinity();
|
|
for (const auto& packet_info : frame.PacketInfos()) {
|
|
if (packet_info.receive_time().IsFinite()) {
|
|
first_recv_time = std::min(first_recv_time, packet_info.receive_time());
|
|
}
|
|
}
|
|
return first_recv_time;
|
|
}
|
|
|
|
Timestamp ReceiveTime(const EncodedFrame& frame) {
|
|
std::optional<Timestamp> ts = frame.ReceivedTimestamp();
|
|
RTC_DCHECK(ts.has_value()) << "Received frame must have a timestamp set!";
|
|
return *ts;
|
|
}
|
|
|
|
} // namespace
|
|
|
|
VideoStreamBufferController::VideoStreamBufferController(
|
|
Clock* clock,
|
|
TaskQueueBase* worker_queue,
|
|
VCMTiming* timing,
|
|
VideoStreamBufferControllerStatsObserver* stats_proxy,
|
|
FrameSchedulingReceiver* receiver,
|
|
TimeDelta max_wait_for_keyframe,
|
|
TimeDelta max_wait_for_frame,
|
|
std::unique_ptr<FrameDecodeScheduler> frame_decode_scheduler,
|
|
const FieldTrialsView& field_trials)
|
|
: field_trials_(field_trials),
|
|
clock_(clock),
|
|
stats_proxy_(stats_proxy),
|
|
receiver_(receiver),
|
|
timing_(timing),
|
|
frame_decode_scheduler_(std::move(frame_decode_scheduler)),
|
|
jitter_estimator_(clock_, field_trials),
|
|
buffer_(std::make_unique<FrameBuffer>(kMaxFramesBuffered,
|
|
kMaxFramesHistory,
|
|
field_trials)),
|
|
decode_timing_(clock_, timing_),
|
|
timeout_tracker_(
|
|
clock_,
|
|
worker_queue,
|
|
VideoReceiveStreamTimeoutTracker::Timeouts{
|
|
.max_wait_for_keyframe = max_wait_for_keyframe,
|
|
.max_wait_for_frame = max_wait_for_frame},
|
|
absl::bind_front(&VideoStreamBufferController::OnTimeout, this)),
|
|
zero_playout_delay_max_decode_queue_size_(
|
|
"max_decode_queue_size",
|
|
kZeroPlayoutDelayDefaultMaxDecodeQueueSize) {
|
|
RTC_DCHECK(stats_proxy_);
|
|
RTC_DCHECK(receiver_);
|
|
RTC_DCHECK(timing_);
|
|
RTC_DCHECK(clock_);
|
|
RTC_DCHECK(frame_decode_scheduler_);
|
|
|
|
ParseFieldTrial({&zero_playout_delay_max_decode_queue_size_},
|
|
field_trials.Lookup("WebRTC-ZeroPlayoutDelay"));
|
|
}
|
|
|
|
void VideoStreamBufferController::Stop() {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
frame_decode_scheduler_->Stop();
|
|
timeout_tracker_.Stop();
|
|
decoder_ready_for_new_frame_ = false;
|
|
}
|
|
|
|
void VideoStreamBufferController::SetProtectionMode(
|
|
VCMVideoProtection protection_mode) {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
protection_mode_ = protection_mode;
|
|
}
|
|
|
|
void VideoStreamBufferController::Clear() {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
stats_proxy_->OnDroppedFrames(buffer_->CurrentSize());
|
|
buffer_ = std::make_unique<FrameBuffer>(kMaxFramesBuffered, kMaxFramesHistory,
|
|
field_trials_);
|
|
frame_decode_scheduler_->CancelOutstanding();
|
|
}
|
|
|
|
std::optional<int64_t> VideoStreamBufferController::InsertFrame(
|
|
std::unique_ptr<EncodedFrame> frame) {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
FrameMetadata metadata(*frame);
|
|
int complete_units = buffer_->GetTotalNumberOfContinuousTemporalUnits();
|
|
if (buffer_->InsertFrame(std::move(frame))) {
|
|
RTC_DCHECK(metadata.receive_time) << "Frame receive time must be set!";
|
|
if (!metadata.delayed_by_retransmission && metadata.receive_time &&
|
|
(field_trials_.IsDisabled("WebRTC-IncomingTimestampOnMarkerBitOnly") ||
|
|
metadata.is_last_spatial_layer)) {
|
|
timing_->IncomingTimestamp(metadata.rtp_timestamp,
|
|
*metadata.receive_time);
|
|
}
|
|
if (complete_units < buffer_->GetTotalNumberOfContinuousTemporalUnits()) {
|
|
stats_proxy_->OnCompleteFrame(metadata.is_keyframe, metadata.size,
|
|
metadata.contentType);
|
|
MaybeScheduleFrameForRelease();
|
|
}
|
|
}
|
|
|
|
return buffer_->LastContinuousFrameId();
|
|
}
|
|
|
|
void VideoStreamBufferController::UpdateRtt(int64_t max_rtt_ms) {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
jitter_estimator_.UpdateRtt(TimeDelta::Millis(max_rtt_ms));
|
|
}
|
|
|
|
void VideoStreamBufferController::SetMaxWaits(TimeDelta max_wait_for_keyframe,
|
|
TimeDelta max_wait_for_frame) {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
timeout_tracker_.SetTimeouts({.max_wait_for_keyframe = max_wait_for_keyframe,
|
|
.max_wait_for_frame = max_wait_for_frame});
|
|
}
|
|
|
|
void VideoStreamBufferController::StartNextDecode(bool keyframe_required) {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
if (!timeout_tracker_.Running())
|
|
timeout_tracker_.Start(keyframe_required);
|
|
keyframe_required_ = keyframe_required;
|
|
if (keyframe_required_) {
|
|
timeout_tracker_.SetWaitingForKeyframe();
|
|
}
|
|
decoder_ready_for_new_frame_ = true;
|
|
MaybeScheduleFrameForRelease();
|
|
}
|
|
|
|
int VideoStreamBufferController::Size() {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
return buffer_->CurrentSize();
|
|
}
|
|
|
|
void VideoStreamBufferController::OnFrameReady(
|
|
absl::InlinedVector<std::unique_ptr<EncodedFrame>, 4> frames,
|
|
Timestamp render_time) {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
RTC_CHECK(!frames.empty())
|
|
<< "Callers must ensure there is at least one frame to decode.";
|
|
|
|
timeout_tracker_.OnEncodedFrameReleased();
|
|
|
|
Timestamp now = clock_->CurrentTime();
|
|
bool superframe_delayed_by_retransmission = false;
|
|
DataSize superframe_size = DataSize::Zero();
|
|
const EncodedFrame& first_frame = *frames.front();
|
|
Timestamp min_receive_time = MinReceiveTime(first_frame);
|
|
Timestamp max_receive_time = ReceiveTime(first_frame);
|
|
|
|
if (first_frame.is_keyframe())
|
|
keyframe_required_ = false;
|
|
|
|
// Gracefully handle bad RTP timestamps and render time issues.
|
|
if (FrameHasBadRenderTiming(render_time, now) ||
|
|
TargetVideoDelayIsTooLarge(timing_->TargetVideoDelay())) {
|
|
RTC_LOG(LS_WARNING) << "Resetting jitter estimator and timing module due "
|
|
"to bad render timing for rtp_timestamp="
|
|
<< first_frame.RtpTimestamp();
|
|
jitter_estimator_.Reset();
|
|
timing_->Reset();
|
|
render_time = timing_->RenderTime(first_frame.RtpTimestamp(), now);
|
|
}
|
|
|
|
for (std::unique_ptr<EncodedFrame>& frame : frames) {
|
|
frame->SetRenderTime(render_time.ms());
|
|
|
|
superframe_delayed_by_retransmission |= frame->delayed_by_retransmission();
|
|
min_receive_time = std::min(min_receive_time, MinReceiveTime(*frame));
|
|
max_receive_time = std::max(max_receive_time, ReceiveTime(*frame));
|
|
superframe_size += DataSize::Bytes(frame->size());
|
|
}
|
|
|
|
if (!superframe_delayed_by_retransmission) {
|
|
std::optional<TimeDelta> inter_frame_delay_variation =
|
|
ifdv_calculator_.Calculate(first_frame.RtpTimestamp(),
|
|
max_receive_time);
|
|
if (inter_frame_delay_variation) {
|
|
jitter_estimator_.UpdateEstimate(*inter_frame_delay_variation,
|
|
superframe_size);
|
|
}
|
|
|
|
static constexpr float kRttMult = 0.9f;
|
|
static constexpr TimeDelta kRttMultAddCap = TimeDelta::Millis(200);
|
|
timing_->SetJitterDelay(
|
|
jitter_estimator_.GetJitterEstimate(kRttMult, kRttMultAddCap));
|
|
timing_->UpdateCurrentDelay(render_time, now);
|
|
} else {
|
|
jitter_estimator_.FrameNacked();
|
|
}
|
|
|
|
// Update stats.
|
|
UpdateDroppedFrames();
|
|
UpdateFrameBufferTimings(min_receive_time, now);
|
|
UpdateTimingFrameInfo();
|
|
|
|
std::unique_ptr<EncodedFrame> frame =
|
|
CombineAndDeleteFrames(std::move(frames));
|
|
|
|
timing_->SetLastDecodeScheduledTimestamp(now);
|
|
|
|
decoder_ready_for_new_frame_ = false;
|
|
receiver_->OnEncodedFrame(std::move(frame));
|
|
}
|
|
|
|
void VideoStreamBufferController::OnTimeout(TimeDelta delay) {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
|
|
// Stop sending timeouts until receiver starts waiting for a new frame.
|
|
timeout_tracker_.Stop();
|
|
|
|
// If the stream is paused then ignore the timeout.
|
|
if (!decoder_ready_for_new_frame_) {
|
|
return;
|
|
}
|
|
decoder_ready_for_new_frame_ = false;
|
|
receiver_->OnDecodableFrameTimeout(delay);
|
|
}
|
|
|
|
void VideoStreamBufferController::FrameReadyForDecode(uint32_t rtp_timestamp,
|
|
Timestamp render_time) {
|
|
RTC_DCHECK_RUN_ON(&worker_sequence_checker_);
|
|
// Check that the frame to decode is still valid before passing the frame for
|
|
// decoding.
|
|
auto decodable_tu_info = buffer_->DecodableTemporalUnitsInfo();
|
|
if (!decodable_tu_info) {
|
|
RTC_LOG(LS_ERROR)
|
|
<< "The frame buffer became undecodable during the wait "
|
|
"to decode frame with rtp-timestamp "
|
|
<< rtp_timestamp
|
|
<< ". Cancelling the decode of this frame, decoding "
|
|
"will resume when the frame buffers become decodable again.";
|
|
return;
|
|
}
|
|
RTC_DCHECK_EQ(rtp_timestamp, decodable_tu_info->next_rtp_timestamp)
|
|
<< "Frame buffer's next decodable frame was not the one sent for "
|
|
"extraction.";
|
|
auto frames = buffer_->ExtractNextDecodableTemporalUnit();
|
|
if (frames.empty()) {
|
|
RTC_LOG(LS_ERROR)
|
|
<< "The frame buffer should never return an empty temporal until list "
|
|
"when there is a decodable temporal unit.";
|
|
RTC_DCHECK_NOTREACHED();
|
|
return;
|
|
}
|
|
OnFrameReady(std::move(frames), render_time);
|
|
}
|
|
|
|
void VideoStreamBufferController::UpdateDroppedFrames()
|
|
RTC_RUN_ON(&worker_sequence_checker_) {
|
|
const int dropped_frames = buffer_->GetTotalNumberOfDroppedFrames() -
|
|
frames_dropped_before_last_new_frame_;
|
|
if (dropped_frames > 0)
|
|
stats_proxy_->OnDroppedFrames(dropped_frames);
|
|
frames_dropped_before_last_new_frame_ =
|
|
buffer_->GetTotalNumberOfDroppedFrames();
|
|
}
|
|
|
|
void VideoStreamBufferController::UpdateFrameBufferTimings(
|
|
Timestamp min_receive_time,
|
|
Timestamp now) {
|
|
// Update instantaneous delays.
|
|
auto timings = timing_->GetTimings();
|
|
if (timings.num_decoded_frames) {
|
|
stats_proxy_->OnFrameBufferTimingsUpdated(
|
|
timings.estimated_max_decode_time.ms(), timings.current_delay.ms(),
|
|
timings.target_delay.ms(), timings.minimum_delay.ms(),
|
|
timings.min_playout_delay.ms(), timings.render_delay.ms());
|
|
}
|
|
|
|
// The spec mandates that `jitterBufferDelay` is the "time the first
|
|
// packet is received by the jitter buffer (ingest timestamp) to the time it
|
|
// exits the jitter buffer (emit timestamp)". Since the "jitter buffer"
|
|
// is not a monolith in the webrtc.org implementation, we take the freedom to
|
|
// define "ingest timestamp" as "first packet received by
|
|
// RtpVideoStreamReceiver2" and "emit timestamp" as "decodable frame released
|
|
// by VideoStreamBufferController".
|
|
//
|
|
// https://w3c.github.io/webrtc-stats/#dom-rtcinboundrtpstreamstats-jitterbufferdelay
|
|
TimeDelta jitter_buffer_delay =
|
|
std::max(TimeDelta::Zero(), now - min_receive_time);
|
|
stats_proxy_->OnDecodableFrame(jitter_buffer_delay, timings.target_delay,
|
|
timings.minimum_delay);
|
|
}
|
|
|
|
void VideoStreamBufferController::UpdateTimingFrameInfo() {
|
|
std::optional<TimingFrameInfo> info = timing_->GetTimingFrameInfo();
|
|
if (info)
|
|
stats_proxy_->OnTimingFrameInfoUpdated(*info);
|
|
}
|
|
|
|
bool VideoStreamBufferController::IsTooManyFramesQueued() const
|
|
RTC_RUN_ON(&worker_sequence_checker_) {
|
|
return buffer_->CurrentSize() > zero_playout_delay_max_decode_queue_size_;
|
|
}
|
|
|
|
void VideoStreamBufferController::ForceKeyFrameReleaseImmediately()
|
|
RTC_RUN_ON(&worker_sequence_checker_) {
|
|
RTC_DCHECK(keyframe_required_);
|
|
// Iterate through the frame buffer until there is a complete keyframe and
|
|
// release this right away.
|
|
while (buffer_->DecodableTemporalUnitsInfo()) {
|
|
auto next_frame = buffer_->ExtractNextDecodableTemporalUnit();
|
|
if (next_frame.empty()) {
|
|
RTC_DCHECK_NOTREACHED()
|
|
<< "Frame buffer should always return at least 1 frame.";
|
|
continue;
|
|
}
|
|
// Found keyframe - decode right away.
|
|
if (next_frame.front()->is_keyframe()) {
|
|
auto render_time = timing_->RenderTime(next_frame.front()->RtpTimestamp(),
|
|
clock_->CurrentTime());
|
|
OnFrameReady(std::move(next_frame), render_time);
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
|
|
void VideoStreamBufferController::MaybeScheduleFrameForRelease()
|
|
RTC_RUN_ON(&worker_sequence_checker_) {
|
|
auto decodable_tu_info = buffer_->DecodableTemporalUnitsInfo();
|
|
if (!decoder_ready_for_new_frame_ || !decodable_tu_info) {
|
|
return;
|
|
}
|
|
|
|
if (keyframe_required_) {
|
|
return ForceKeyFrameReleaseImmediately();
|
|
}
|
|
|
|
// If already scheduled then abort.
|
|
if (frame_decode_scheduler_->ScheduledRtpTimestamp() ==
|
|
decodable_tu_info->next_rtp_timestamp) {
|
|
return;
|
|
}
|
|
|
|
TimeDelta max_wait = timeout_tracker_.TimeUntilTimeout();
|
|
// Ensures the frame is scheduled for decode before the stream times out.
|
|
// This is otherwise a race condition.
|
|
max_wait = std::max(max_wait - TimeDelta::Millis(1), TimeDelta::Zero());
|
|
std::optional<FrameDecodeTiming::FrameSchedule> schedule;
|
|
while (decodable_tu_info) {
|
|
schedule = decode_timing_.OnFrameBufferUpdated(
|
|
decodable_tu_info->next_rtp_timestamp,
|
|
decodable_tu_info->last_rtp_timestamp, max_wait,
|
|
IsTooManyFramesQueued());
|
|
if (schedule) {
|
|
// Don't schedule if already waiting for the same frame.
|
|
if (frame_decode_scheduler_->ScheduledRtpTimestamp() !=
|
|
decodable_tu_info->next_rtp_timestamp) {
|
|
frame_decode_scheduler_->CancelOutstanding();
|
|
frame_decode_scheduler_->ScheduleFrame(
|
|
decodable_tu_info->next_rtp_timestamp, *schedule,
|
|
absl::bind_front(&VideoStreamBufferController::FrameReadyForDecode,
|
|
this));
|
|
}
|
|
return;
|
|
}
|
|
// If no schedule for current rtp, drop and try again.
|
|
buffer_->DropNextDecodableTemporalUnit();
|
|
decodable_tu_info = buffer_->DecodableTemporalUnitsInfo();
|
|
}
|
|
}
|
|
|
|
} // namespace webrtc
|