mirror of
https://github.com/mollyim/webrtc.git
synced 2025-05-17 23:57:59 +01:00

Bug: webrtc:342905193 No-Try: True Change-Id: Icc968be43b8830038ea9a1f5f604307220457807 Reviewed-on: https://webrtc-review.googlesource.com/c/src/+/361021 Auto-Submit: Florent Castelli <orphis@webrtc.org> Reviewed-by: Harald Alvestrand <hta@webrtc.org> Commit-Queue: Florent Castelli <orphis@webrtc.org> Cr-Commit-Position: refs/heads/main@{#42911}
722 lines
26 KiB
C++
722 lines
26 KiB
C++
/*
|
|
* Copyright (c) 2023 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include <string>
|
|
|
|
#include "absl/flags/flag.h"
|
|
#include "absl/flags/parse.h"
|
|
#include "absl/flags/usage.h"
|
|
#include "absl/strings/match.h"
|
|
#include "api/environment/environment.h"
|
|
#include "api/environment/environment_factory.h"
|
|
#include "api/test/create_frame_generator.h"
|
|
#include "api/test/frame_generator_interface.h"
|
|
#include "api/video/builtin_video_bitrate_allocator_factory.h"
|
|
#include "api/video_codecs/builtin_video_decoder_factory.h"
|
|
#include "api/video_codecs/builtin_video_encoder_factory.h"
|
|
#include "common_video/libyuv/include/webrtc_libyuv.h"
|
|
#include "media/base/media_constants.h"
|
|
#include "modules/video_coding/codecs/av1/av1_svc_config.h"
|
|
#include "modules/video_coding/include/video_codec_interface.h"
|
|
#include "modules/video_coding/svc/scalability_mode_util.h"
|
|
#include "rtc_base/logging.h"
|
|
#include "rtc_tools/video_encoder/encoded_image_file_writer.h"
|
|
#include "test/testsupport/y4m_frame_generator.h"
|
|
|
|
ABSL_FLAG(std::string,
|
|
video_codec,
|
|
"",
|
|
"Specify codec of video encoder: vp8, vp9, h264, av1");
|
|
ABSL_FLAG(std::string,
|
|
scalability_mode,
|
|
"L1T1",
|
|
"Specify scalability mode of video encoder");
|
|
|
|
ABSL_FLAG(uint32_t,
|
|
raw_frame_generator,
|
|
0,
|
|
"Specify SquareFrameGenerator or SlideGenerator.\n"
|
|
"0: SquareFrameGenerator, 1: SlideGenerator");
|
|
ABSL_FLAG(uint32_t, width, 1280, "Specify width of video encoder");
|
|
ABSL_FLAG(uint32_t, height, 720, "Specify height of video encoder");
|
|
|
|
ABSL_FLAG(std::string,
|
|
input_file,
|
|
"",
|
|
"Support yuv, y4m and ivf input file of video encoder");
|
|
|
|
ABSL_FLAG(uint32_t, frame_rate_fps, 30, "Specify frame rate of video encoder");
|
|
ABSL_FLAG(uint32_t, bitrate_kbps, 0, "Specify bitrate_kbps of video encoder");
|
|
ABSL_FLAG(uint32_t,
|
|
key_frame_interval,
|
|
3000,
|
|
"Specify key frame interval of video encoder");
|
|
|
|
ABSL_FLAG(uint32_t, frames, 300, "Specify maximum encoded frames");
|
|
|
|
ABSL_FLAG(bool,
|
|
list_formats,
|
|
false,
|
|
"List all supported formats of video encoder");
|
|
|
|
ABSL_FLAG(bool, validate_psnr, false, "Validate PSNR of encoded frames.");
|
|
|
|
ABSL_FLAG(bool, verbose, false, "Verbose logs to stderr");
|
|
|
|
namespace webrtc {
|
|
namespace {
|
|
|
|
[[maybe_unused]] const char* InterLayerPredModeToString(
|
|
const InterLayerPredMode& inter_layer_pred_mode) {
|
|
switch (inter_layer_pred_mode) {
|
|
case InterLayerPredMode::kOff:
|
|
return "Off";
|
|
case InterLayerPredMode::kOn:
|
|
return "On";
|
|
case InterLayerPredMode::kOnKeyPic:
|
|
return "OnKeyPic";
|
|
}
|
|
RTC_CHECK_NOTREACHED();
|
|
return "";
|
|
}
|
|
|
|
std::string ToString(const EncodedImage& encoded_image) {
|
|
char buffer[1024];
|
|
rtc::SimpleStringBuilder ss(buffer);
|
|
|
|
ss << VideoFrameTypeToString(encoded_image._frameType)
|
|
<< ", size=" << encoded_image.size() << ", qp=" << encoded_image.qp_
|
|
<< ", timestamp=" << encoded_image.RtpTimestamp();
|
|
|
|
if (encoded_image.SimulcastIndex()) {
|
|
ss << ", SimulcastIndex=" << *encoded_image.SimulcastIndex();
|
|
}
|
|
|
|
if (encoded_image.SpatialIndex()) {
|
|
ss << ", SpatialIndex=" << *encoded_image.SpatialIndex();
|
|
}
|
|
|
|
if (encoded_image.TemporalIndex()) {
|
|
ss << ", TemporalIndex=" << *encoded_image.TemporalIndex();
|
|
}
|
|
|
|
return ss.str();
|
|
}
|
|
|
|
[[maybe_unused]] std::string ToString(
|
|
const CodecSpecificInfo& codec_specific_info) {
|
|
char buffer[1024];
|
|
rtc::SimpleStringBuilder ss(buffer);
|
|
|
|
ss << CodecTypeToPayloadString(codec_specific_info.codecType);
|
|
|
|
if (codec_specific_info.scalability_mode) {
|
|
ss << ", "
|
|
<< ScalabilityModeToString(*codec_specific_info.scalability_mode);
|
|
}
|
|
|
|
if (codec_specific_info.generic_frame_info) {
|
|
auto& generic_frame_info = codec_specific_info.generic_frame_info;
|
|
|
|
ss << ", decode_target_indications="
|
|
<< generic_frame_info->decode_target_indications.size();
|
|
}
|
|
|
|
if (codec_specific_info.template_structure) {
|
|
auto& template_structure = codec_specific_info.template_structure;
|
|
|
|
ss << ", structure_id=" << template_structure->structure_id
|
|
<< ", num_decode_targets=" << template_structure->num_decode_targets
|
|
<< ", num_chains=" << template_structure->num_chains;
|
|
}
|
|
|
|
return ss.str();
|
|
}
|
|
|
|
// This follows
|
|
// https://source.chromium.org/chromium/chromium/src/+/main:media/gpu/test/video_encoder/video_encoder_test_environment.cc;bpv=1;bpt=1;l=64?q=GetDefaultTargetBitrate&ss=chromium%2Fchromium%2Fsrc
|
|
uint32_t GetDefaultTargetBitrate(const VideoCodecType codec,
|
|
const uint32_t width,
|
|
const uint32_t height,
|
|
const uint32_t framerate,
|
|
bool validation = false) {
|
|
// For how these values are decided, see
|
|
// https://docs.google.com/document/d/1Mlu-2mMOqswWaaivIWhn00dYkoTwKcjLrxxBXcWycug
|
|
constexpr struct {
|
|
int area;
|
|
// bitrate[0]: for speed and quality performance
|
|
// bitrate[1]: for validation.
|
|
// The three values are for H264/VP8, VP9 and AV1, respectively.
|
|
double bitrate[2][3];
|
|
} kBitrateTable[] = {
|
|
{0, {{77.5, 65.0, 60.0}, {100.0, 100.0, 100.0}}},
|
|
{240 * 160, {{77.5, 65.0, 60.0}, {115.0, 100.0, 100.0}}},
|
|
{320 * 240, {{165.0, 105.0, 105.0}, {230.0, 180.0, 180.0}}},
|
|
{480 * 270, {{195.0, 180.0, 180.0}, {320.0, 250, 250}}},
|
|
{640 * 480, {{550.0, 355.0, 342.5}, {690.0, 520, 520}}},
|
|
{1280 * 720, {{1700.0, 990.0, 800.0}, {2500.0, 1500, 1200}}},
|
|
{1920 * 1080, {{2480.0, 2060.0, 1500.0}, {4000.0, 3350.0, 2500.0}}},
|
|
};
|
|
size_t codec_index = 0;
|
|
switch (codec) {
|
|
case webrtc::kVideoCodecVP8:
|
|
case webrtc::kVideoCodecH264:
|
|
codec_index = 0;
|
|
break;
|
|
case webrtc::kVideoCodecVP9:
|
|
codec_index = 1;
|
|
break;
|
|
case webrtc::kVideoCodecAV1:
|
|
codec_index = 2;
|
|
break;
|
|
default:
|
|
RTC_LOG(LS_ERROR) << "Unknown codec: " << codec;
|
|
}
|
|
|
|
const int area = width * height;
|
|
RTC_CHECK(area != 0);
|
|
size_t index = std::size(kBitrateTable) - 1;
|
|
for (size_t i = 0; i < std::size(kBitrateTable); ++i) {
|
|
if (area < kBitrateTable[i].area) {
|
|
index = i;
|
|
break;
|
|
}
|
|
}
|
|
// The target bitrates are based on the bitrate tables in
|
|
// go/meet-codec-strategy, see
|
|
// https://docs.google.com/document/d/1Mlu-2mMOqswWaaivIWhn00dYkoTwKcjLrxxBXcWycug/edit.
|
|
const int low_area = kBitrateTable[index - 1].area;
|
|
const double low_bitrate =
|
|
kBitrateTable[index - 1].bitrate[validation][codec_index];
|
|
const int up_area = kBitrateTable[index].area;
|
|
const double up_bitrate =
|
|
kBitrateTable[index].bitrate[validation][codec_index];
|
|
|
|
const double bitrate_in_30fps_in_kbps =
|
|
(up_bitrate - low_bitrate) / (up_area - low_area) * (area - low_area) +
|
|
low_bitrate;
|
|
// This is selected as 1 in 30fps and 1.8 in 60fps.
|
|
const double framerate_multiplier =
|
|
0.27 * (framerate * framerate / 30.0 / 30.0) + 0.73;
|
|
return bitrate_in_30fps_in_kbps * framerate_multiplier * 1000;
|
|
}
|
|
|
|
// The BitstreamProcessor writes all encoded images into ivf
|
|
// files through `test::EncodedImageFileWriter`, and it will also validate the
|
|
// encoded PSNR if necessary.
|
|
class BitstreamProcessor final : public EncodedImageCallback,
|
|
public DecodedImageCallback {
|
|
public:
|
|
constexpr static double kDefaultPSNRTolerance = 25.0;
|
|
|
|
explicit BitstreamProcessor(const Environment& env,
|
|
const VideoCodec& video_codec_setting,
|
|
bool validate_psnr,
|
|
uint32_t frame_rate_fps,
|
|
uint32_t target_bitrate)
|
|
: video_codec_setting_(video_codec_setting),
|
|
validate_psnr_(validate_psnr),
|
|
frame_rate_fps_(frame_rate_fps),
|
|
target_bitrate_(target_bitrate) {
|
|
writer_ =
|
|
std::make_unique<test::EncodedImageFileWriter>(video_codec_setting);
|
|
|
|
// PSNR validation.
|
|
if (validate_psnr_) {
|
|
const std::string video_codec_string =
|
|
CodecTypeToPayloadString(video_codec_setting.codecType);
|
|
// Create video decoder.
|
|
video_decoder_ = CreateBuiltinVideoDecoderFactory()->Create(
|
|
env, SdpVideoFormat(video_codec_string));
|
|
RTC_CHECK(video_decoder_);
|
|
video_decoder_->Configure({});
|
|
video_decoder_->RegisterDecodeCompleteCallback(this);
|
|
}
|
|
}
|
|
|
|
void ValidatePSNR(webrtc::VideoFrame& frame) {
|
|
RTC_CHECK(validate_psnr_);
|
|
video_decoder_->Decode(*encoded_image_, /*dont_care=*/0);
|
|
double psnr = I420PSNR(*frame.video_frame_buffer()->ToI420(),
|
|
*decode_result_->video_frame_buffer()->ToI420());
|
|
psnr_.push_back(psnr);
|
|
if (psnr < kDefaultPSNRTolerance) {
|
|
RTC_LOG(LS_INFO) << __func__ << " Frame number: " << psnr_.size()
|
|
<< " , the PSNR is too low: " << psnr;
|
|
}
|
|
}
|
|
|
|
bool PSNRPassed() {
|
|
RTC_CHECK(validate_psnr_);
|
|
const uint32_t total_frames = psnr_.size();
|
|
double average_psnr = 0;
|
|
for (const auto& psnr : psnr_) {
|
|
average_psnr += psnr;
|
|
}
|
|
average_psnr /= total_frames;
|
|
|
|
const size_t average_frame_size_in_bits =
|
|
total_encoded_frames_size_ * 8 / total_frames;
|
|
const uint32_t average_bitrate =
|
|
average_frame_size_in_bits * frame_rate_fps_;
|
|
RTC_LOG(LS_INFO) << __func__ << " Average PSNR: " << average_psnr
|
|
<< " Average bitrate: " << average_bitrate
|
|
<< " Bitrate deviation: "
|
|
<< (average_bitrate * 100.0 / target_bitrate_) - 100.0
|
|
<< " %";
|
|
if (average_psnr < kDefaultPSNRTolerance) {
|
|
RTC_LOG(LS_ERROR) << __func__
|
|
<< " Average PSNR is too low: " << average_psnr;
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
~BitstreamProcessor() = default;
|
|
|
|
private:
|
|
// DecodedImageCallback
|
|
int32_t Decoded(VideoFrame& frame) override {
|
|
decode_result_ = std::make_unique<VideoFrame>(std::move(frame));
|
|
return 0;
|
|
}
|
|
|
|
Result OnEncodedImage(const EncodedImage& encoded_image,
|
|
const CodecSpecificInfo* codec_specific_info) override {
|
|
RTC_LOG(LS_VERBOSE) << "frame " << frames_ << ": {"
|
|
<< ToString(encoded_image)
|
|
<< "}, codec_specific_info: {"
|
|
<< ToString(*codec_specific_info) << "}";
|
|
|
|
RTC_CHECK(writer_);
|
|
writer_->Write(encoded_image);
|
|
|
|
RTC_CHECK(codec_specific_info);
|
|
// For SVC, every picture generates multiple encoded images of different
|
|
// spatial layers.
|
|
if (codec_specific_info->end_of_picture) {
|
|
++frames_;
|
|
}
|
|
|
|
if (validate_psnr_) {
|
|
encoded_image_ = std::make_unique<EncodedImage>(std::move(encoded_image));
|
|
total_encoded_frames_size_ += encoded_image_->size();
|
|
}
|
|
|
|
return Result(Result::Error::OK);
|
|
}
|
|
|
|
VideoCodec video_codec_setting_;
|
|
int32_t frames_ = 0;
|
|
|
|
std::unique_ptr<test::EncodedImageFileWriter> writer_;
|
|
|
|
const bool validate_psnr_ = false;
|
|
const uint32_t frame_rate_fps_ = 0;
|
|
const uint32_t target_bitrate_ = 0;
|
|
size_t total_encoded_frames_size_ = 0;
|
|
std::vector<double> psnr_;
|
|
std::unique_ptr<VideoDecoder> video_decoder_;
|
|
std::unique_ptr<VideoFrame> decode_result_;
|
|
std::unique_ptr<EncodedImage> encoded_image_;
|
|
};
|
|
|
|
// Wrapper of `BuiltinVideoEncoderFactory`.
|
|
class TestVideoEncoderFactoryWrapper final {
|
|
public:
|
|
TestVideoEncoderFactoryWrapper() {
|
|
builtin_video_encoder_factory_ = CreateBuiltinVideoEncoderFactory();
|
|
RTC_CHECK(builtin_video_encoder_factory_);
|
|
}
|
|
|
|
~TestVideoEncoderFactoryWrapper() = default;
|
|
|
|
void ListSupportedFormats() const {
|
|
// Log all supported formats.
|
|
auto formats = builtin_video_encoder_factory_->GetSupportedFormats();
|
|
for (auto& format : formats) {
|
|
RTC_LOG(LS_INFO) << format.ToString();
|
|
}
|
|
}
|
|
|
|
bool QueryCodecSupport(const std::string& video_codec_string,
|
|
const std::string& scalability_mode_string) const {
|
|
RTC_CHECK(!video_codec_string.empty());
|
|
RTC_CHECK(!scalability_mode_string.empty());
|
|
|
|
// Simulcast is not implemented at this moment.
|
|
if (scalability_mode_string[0] == 'S') {
|
|
RTC_LOG(LS_ERROR) << "Not implemented format: "
|
|
<< scalability_mode_string;
|
|
return false;
|
|
}
|
|
|
|
// VP9 profile2 is not implemented at this moment.
|
|
VideoEncoderFactory::CodecSupport support =
|
|
builtin_video_encoder_factory_->QueryCodecSupport(
|
|
SdpVideoFormat(video_codec_string), scalability_mode_string);
|
|
return support.is_supported;
|
|
}
|
|
|
|
VideoCodec CreateVideoCodec(const std::string& video_codec_string,
|
|
const std::string& scalability_mode_string,
|
|
const uint32_t width,
|
|
const uint32_t height,
|
|
const uint32_t frame_rate_fps,
|
|
const uint32_t bitrate_kbps) {
|
|
VideoCodec video_codec = {};
|
|
|
|
VideoCodecType codec_type = PayloadStringToCodecType(video_codec_string);
|
|
RTC_CHECK_NE(codec_type, kVideoCodecGeneric);
|
|
|
|
// Retrieve scalability mode information.
|
|
std::optional<ScalabilityMode> scalability_mode =
|
|
ScalabilityModeFromString(scalability_mode_string);
|
|
RTC_CHECK(scalability_mode);
|
|
|
|
uint32_t spatial_layers =
|
|
ScalabilityModeToNumSpatialLayers(*scalability_mode);
|
|
uint32_t temporal_layers =
|
|
ScalabilityModeToNumTemporalLayers(*scalability_mode);
|
|
InterLayerPredMode inter_layer_pred_mode =
|
|
ScalabilityModeToInterLayerPredMode(*scalability_mode);
|
|
|
|
// Codec settings.
|
|
video_codec.SetScalabilityMode(*scalability_mode);
|
|
video_codec.SetFrameDropEnabled(false);
|
|
video_codec.SetVideoEncoderComplexity(
|
|
VideoCodecComplexity::kComplexityNormal);
|
|
|
|
video_codec.width = width;
|
|
video_codec.height = height;
|
|
video_codec.maxFramerate = frame_rate_fps;
|
|
|
|
video_codec.startBitrate = bitrate_kbps;
|
|
video_codec.maxBitrate = bitrate_kbps;
|
|
video_codec.minBitrate = bitrate_kbps;
|
|
|
|
video_codec.active = true;
|
|
|
|
// Simulcast is not implemented at this moment.
|
|
video_codec.numberOfSimulcastStreams = 0;
|
|
|
|
video_codec.codecType = codec_type;
|
|
// Codec specific settings.
|
|
switch (video_codec.codecType) {
|
|
case kVideoCodecVP8:
|
|
RTC_CHECK_LE(spatial_layers, 1);
|
|
|
|
*(video_codec.VP8()) = VideoEncoder::GetDefaultVp8Settings();
|
|
video_codec.VP8()->numberOfTemporalLayers = temporal_layers;
|
|
video_codec.qpMax = cricket::kDefaultVideoMaxQpVpx;
|
|
break;
|
|
|
|
case kVideoCodecVP9:
|
|
*(video_codec.VP9()) = VideoEncoder::GetDefaultVp9Settings();
|
|
video_codec.VP9()->numberOfSpatialLayers = spatial_layers;
|
|
video_codec.VP9()->numberOfTemporalLayers = temporal_layers;
|
|
video_codec.VP9()->interLayerPred = inter_layer_pred_mode;
|
|
video_codec.qpMax = cricket::kDefaultVideoMaxQpVpx;
|
|
break;
|
|
|
|
case kVideoCodecH264:
|
|
RTC_CHECK_LE(spatial_layers, 1);
|
|
|
|
*(video_codec.H264()) = VideoEncoder::GetDefaultH264Settings();
|
|
video_codec.H264()->numberOfTemporalLayers = temporal_layers;
|
|
video_codec.qpMax = cricket::kDefaultVideoMaxQpH26x;
|
|
break;
|
|
|
|
case kVideoCodecAV1:
|
|
if (SetAv1SvcConfig(video_codec, temporal_layers, spatial_layers)) {
|
|
for (size_t i = 0; i < spatial_layers; ++i) {
|
|
video_codec.spatialLayers[i].active = true;
|
|
}
|
|
} else {
|
|
RTC_LOG(LS_WARNING) << "Failed to configure svc bitrates for av1.";
|
|
}
|
|
video_codec.qpMax = cricket::kDefaultVideoMaxQpVpx;
|
|
break;
|
|
case kVideoCodecH265:
|
|
// TODO(bugs.webrtc.org/13485)
|
|
video_codec.qpMax = cricket::kDefaultVideoMaxQpH26x;
|
|
break;
|
|
default:
|
|
RTC_CHECK_NOTREACHED();
|
|
break;
|
|
}
|
|
|
|
return video_codec;
|
|
}
|
|
|
|
std::unique_ptr<VideoEncoder> CreateAndInitializeVideoEncoder(
|
|
const Environment& env,
|
|
const VideoCodec& video_codec_setting) {
|
|
const std::string video_codec_string =
|
|
CodecTypeToPayloadString(video_codec_setting.codecType);
|
|
const uint32_t bitrate_kbps = video_codec_setting.maxBitrate;
|
|
const uint32_t frame_rate_fps = video_codec_setting.maxFramerate;
|
|
|
|
// Create video encoder.
|
|
std::unique_ptr<VideoEncoder> video_encoder =
|
|
builtin_video_encoder_factory_->Create(
|
|
env, SdpVideoFormat(video_codec_string));
|
|
RTC_CHECK(video_encoder);
|
|
|
|
// Initialize video encoder.
|
|
const webrtc::VideoEncoder::Settings kSettings(
|
|
webrtc::VideoEncoder::Capabilities(false),
|
|
/*number_of_cores=*/1,
|
|
/*max_payload_size=*/0);
|
|
|
|
int ret = video_encoder->InitEncode(&video_codec_setting, kSettings);
|
|
RTC_CHECK_EQ(ret, WEBRTC_VIDEO_CODEC_OK);
|
|
|
|
// Set bitrates.
|
|
std::unique_ptr<VideoBitrateAllocator> bitrate_allocator =
|
|
CreateBuiltinVideoBitrateAllocatorFactory()->Create(
|
|
env, video_codec_setting);
|
|
RTC_CHECK(bitrate_allocator);
|
|
|
|
webrtc::VideoBitrateAllocation allocation =
|
|
bitrate_allocator->GetAllocation(bitrate_kbps * 1000, frame_rate_fps);
|
|
RTC_LOG(LS_INFO) << allocation.ToString();
|
|
|
|
video_encoder->SetRates(webrtc::VideoEncoder::RateControlParameters(
|
|
allocation, frame_rate_fps));
|
|
|
|
return video_encoder;
|
|
}
|
|
|
|
private:
|
|
std::unique_ptr<VideoEncoderFactory> builtin_video_encoder_factory_;
|
|
};
|
|
|
|
} // namespace
|
|
} // namespace webrtc
|
|
|
|
// A video encode tool supports to specify video codec, scalability mode,
|
|
// resolution, frame rate, bitrate, key frame interval and maximum number of
|
|
// frames. The video encoder supports multiple `FrameGeneratorInterface`
|
|
// implementations: `SquareFrameGenerator`, `SlideFrameGenerator`,
|
|
// `YuvFileGenerator`, `Y4mFrameGenerator` and `IvfFileFrameGenerator`. All the
|
|
// encoded bitstreams are wrote into ivf output files.
|
|
int main(int argc, char* argv[]) {
|
|
absl::SetProgramUsageMessage(
|
|
"A video encode tool.\n"
|
|
"\n"
|
|
"Example usage:\n"
|
|
"./video_encoder --list_formats\n"
|
|
"\n"
|
|
"./video_encoder --video_codec=vp8 --width=1280 "
|
|
"--height=720 --bitrate_kbps=1500\n"
|
|
"\n"
|
|
"./video_encoder --raw_frame_generator=1 --video_codec=vp9 "
|
|
"--scalability_mode=L3T3_KEY --width=640 --height=360 "
|
|
"--frame_rate_fps=30 "
|
|
"--bitrate_kbps=500\n"
|
|
"\n"
|
|
"./video_encoder --input_file=input.yuv --video_codec=av1 "
|
|
"--width=640 --height=360 --frames=300 --validate_psnr"
|
|
"--scalability_mode=L1T3 (Note the width and height must match the yuv "
|
|
"file)\n"
|
|
"\n"
|
|
"./video_encoder --input_file=input.y4m --video_codec=av1 "
|
|
"--scalability_mode=L1T3\n"
|
|
"\n"
|
|
"./video_encoder --input_file=input.ivf --video_codec=av1 "
|
|
"--scalability_mode=L1T3\n");
|
|
absl::ParseCommandLine(argc, argv);
|
|
|
|
if (absl::GetFlag(FLAGS_verbose)) {
|
|
rtc::LogMessage::LogToDebug(rtc::LS_VERBOSE);
|
|
} else {
|
|
rtc::LogMessage::LogToDebug(rtc::LS_INFO);
|
|
}
|
|
|
|
rtc::LogMessage::SetLogToStderr(true);
|
|
|
|
const bool list_formats = absl::GetFlag(FLAGS_list_formats);
|
|
const bool validate_psnr = absl::GetFlag(FLAGS_validate_psnr);
|
|
|
|
// Video encoder configurations.
|
|
const std::string video_codec_string = absl::GetFlag(FLAGS_video_codec);
|
|
const std::string scalability_mode_string =
|
|
absl::GetFlag(FLAGS_scalability_mode);
|
|
|
|
const uint32_t width = absl::GetFlag(FLAGS_width);
|
|
const uint32_t height = absl::GetFlag(FLAGS_height);
|
|
|
|
uint32_t raw_frame_generator = absl::GetFlag(FLAGS_raw_frame_generator);
|
|
|
|
const std::string input_file = absl::GetFlag(FLAGS_input_file);
|
|
|
|
const uint32_t frame_rate_fps = absl::GetFlag(FLAGS_frame_rate_fps);
|
|
const uint32_t key_frame_interval = absl::GetFlag(FLAGS_key_frame_interval);
|
|
const uint32_t maximum_number_of_frames = absl::GetFlag(FLAGS_frames);
|
|
uint32_t bitrate_kbps = absl::GetFlag(FLAGS_bitrate_kbps);
|
|
|
|
const webrtc::Environment env = webrtc::CreateEnvironment();
|
|
|
|
std::unique_ptr<webrtc::TestVideoEncoderFactoryWrapper>
|
|
test_video_encoder_factory_wrapper =
|
|
std::make_unique<webrtc::TestVideoEncoderFactoryWrapper>();
|
|
|
|
// List all supported formats.
|
|
if (list_formats) {
|
|
test_video_encoder_factory_wrapper->ListSupportedFormats();
|
|
return EXIT_SUCCESS;
|
|
}
|
|
|
|
if (video_codec_string.empty()) {
|
|
RTC_LOG(LS_ERROR) << "Video codec is empty";
|
|
return EXIT_FAILURE;
|
|
}
|
|
|
|
if (scalability_mode_string.empty()) {
|
|
RTC_LOG(LS_ERROR) << "Scalability mode is empty";
|
|
return EXIT_FAILURE;
|
|
}
|
|
|
|
// Check if the format is supported.
|
|
bool is_supported = test_video_encoder_factory_wrapper->QueryCodecSupport(
|
|
video_codec_string, scalability_mode_string);
|
|
if (!is_supported) {
|
|
RTC_LOG(LS_ERROR) << "Not supported format: video codec "
|
|
<< video_codec_string << ", scalability_mode "
|
|
<< scalability_mode_string;
|
|
return EXIT_FAILURE;
|
|
}
|
|
|
|
// Use the default targit bitrate if the `bitrate_kbps` is not specified.
|
|
if (bitrate_kbps == 0) {
|
|
bitrate_kbps = webrtc::GetDefaultTargetBitrate(
|
|
webrtc::PayloadStringToCodecType(video_codec_string),
|
|
width, height, frame_rate_fps) /
|
|
1000;
|
|
}
|
|
|
|
std::unique_ptr<webrtc::test::FrameGeneratorInterface> frame_buffer_generator;
|
|
if (absl::EndsWith(input_file, ".yuv")) {
|
|
frame_buffer_generator = webrtc::test::CreateFromYuvFileFrameGenerator(
|
|
{input_file}, width, height, /*frame_repeat_count=*/1);
|
|
|
|
RTC_LOG(LS_INFO) << "Create YuvFileGenerator: " << width << "x" << height;
|
|
} else if (absl::EndsWith(input_file, ".y4m")) {
|
|
frame_buffer_generator = std::make_unique<webrtc::test::Y4mFrameGenerator>(
|
|
input_file, webrtc::test::Y4mFrameGenerator::RepeatMode::kLoop);
|
|
|
|
webrtc::test::FrameGeneratorInterface::Resolution resolution =
|
|
frame_buffer_generator->GetResolution();
|
|
if (resolution.width != width || resolution.height != height) {
|
|
frame_buffer_generator->ChangeResolution(width, height);
|
|
}
|
|
|
|
RTC_LOG(LS_INFO) << "Create Y4mFrameGenerator: " << width << "x" << height;
|
|
} else if (absl::EndsWith(input_file, ".ivf")) {
|
|
frame_buffer_generator =
|
|
webrtc::test::CreateFromIvfFileFrameGenerator(env, input_file);
|
|
|
|
// Set width and height.
|
|
webrtc::test::FrameGeneratorInterface::Resolution resolution =
|
|
frame_buffer_generator->GetResolution();
|
|
if (resolution.width != width || resolution.height != height) {
|
|
frame_buffer_generator->ChangeResolution(width, height);
|
|
}
|
|
|
|
RTC_LOG(LS_INFO) << "CreateFromIvfFileFrameGenerator: " << input_file
|
|
<< ", " << width << "x" << height;
|
|
} else {
|
|
RTC_CHECK_LE(raw_frame_generator, 1);
|
|
|
|
if (raw_frame_generator == 0) {
|
|
// Use `SquareFrameGenerator`.
|
|
frame_buffer_generator = webrtc::test::CreateSquareFrameGenerator(
|
|
width, height,
|
|
webrtc::test::FrameGeneratorInterface::OutputType::kI420,
|
|
std::nullopt);
|
|
RTC_CHECK(frame_buffer_generator);
|
|
|
|
RTC_LOG(LS_INFO) << "CreateSquareFrameGenerator: " << width << "x"
|
|
<< height;
|
|
} else {
|
|
// Use `SlideFrameGenerator`.
|
|
const int kFrameRepeatCount = frame_rate_fps;
|
|
frame_buffer_generator = webrtc::test::CreateSlideFrameGenerator(
|
|
width, height, kFrameRepeatCount);
|
|
RTC_CHECK(frame_buffer_generator);
|
|
|
|
RTC_LOG(LS_INFO) << "CreateSlideFrameGenerator: " << width << "x"
|
|
<< height << ", frame_repeat_count "
|
|
<< kFrameRepeatCount;
|
|
}
|
|
}
|
|
|
|
RTC_LOG(LS_INFO) << "Create video encoder, video codec " << video_codec_string
|
|
<< ", scalability mode " << scalability_mode_string << ", "
|
|
<< width << "x" << height << ", frame rate "
|
|
<< frame_rate_fps << ", bitrate_kbps " << bitrate_kbps
|
|
<< ", key frame interval " << key_frame_interval
|
|
<< ", frames " << maximum_number_of_frames
|
|
<< ", validate_psnr " << validate_psnr;
|
|
|
|
// Create and initialize video encoder.
|
|
webrtc::VideoCodec video_codec_setting =
|
|
test_video_encoder_factory_wrapper->CreateVideoCodec(
|
|
video_codec_string, scalability_mode_string, width, height,
|
|
frame_rate_fps, bitrate_kbps);
|
|
|
|
std::unique_ptr<webrtc::VideoEncoder> video_encoder =
|
|
test_video_encoder_factory_wrapper->CreateAndInitializeVideoEncoder(
|
|
env, video_codec_setting);
|
|
RTC_CHECK(video_encoder);
|
|
|
|
// Create `BitstreamProcessor`.
|
|
std::unique_ptr<webrtc::BitstreamProcessor> bitstream_processor =
|
|
std::make_unique<webrtc::BitstreamProcessor>(
|
|
env, video_codec_setting, validate_psnr, frame_rate_fps,
|
|
bitrate_kbps * 1000);
|
|
RTC_CHECK(bitstream_processor);
|
|
int ret =
|
|
video_encoder->RegisterEncodeCompleteCallback(bitstream_processor.get());
|
|
RTC_CHECK_EQ(ret, WEBRTC_VIDEO_CODEC_OK);
|
|
|
|
// Start to encode frames.
|
|
const uint32_t kRtpTick = 90000 / frame_rate_fps;
|
|
// `IvfFileWriter` expects non-zero timestamp for the first frame.
|
|
uint32_t rtp_timestamp = 1;
|
|
for (uint32_t i = 0; i < maximum_number_of_frames; ++i) {
|
|
// Generate key frame for every `key_frame_interval`.
|
|
std::vector<webrtc::VideoFrameType> frame_types = {
|
|
(i % key_frame_interval) ? webrtc::VideoFrameType::kVideoFrameDelta
|
|
: webrtc::VideoFrameType::kVideoFrameKey};
|
|
webrtc::VideoFrame frame =
|
|
webrtc::VideoFrame::Builder()
|
|
.set_video_frame_buffer(frame_buffer_generator->NextFrame().buffer)
|
|
.set_rtp_timestamp(rtp_timestamp)
|
|
.build();
|
|
ret = video_encoder->Encode(frame, &frame_types);
|
|
if (validate_psnr) {
|
|
bitstream_processor->ValidatePSNR(frame);
|
|
}
|
|
RTC_CHECK_EQ(ret, WEBRTC_VIDEO_CODEC_OK);
|
|
|
|
rtp_timestamp += kRtpTick;
|
|
}
|
|
|
|
// Cleanup.
|
|
video_encoder->Release();
|
|
|
|
if (validate_psnr && !bitstream_processor->PSNRPassed()) {
|
|
return EXIT_FAILURE;
|
|
}
|
|
|
|
return EXIT_SUCCESS;
|
|
}
|