unplugged-system/external/libvpx/test/vp9_ratectrl_rtc_test.cc

517 lines
18 KiB
C++

/*
* Copyright (c) 2020 The WebM project authors. All Rights Reserved.
*
* Use of this source code is governed by a BSD-style license
* that can be found in the LICENSE file in the root of the source
* tree. An additional intellectual property rights grant can be found
* in the file PATENTS. All contributing project authors may
* be found in the AUTHORS file in the root of the source tree.
*/
#include "vp9/ratectrl_rtc.h"
#include <fstream> // NOLINT
#include <string>
#include "./vpx_config.h"
#include "third_party/googletest/src/include/gtest/gtest.h"
#include "test/codec_factory.h"
#include "test/encode_test_driver.h"
#include "test/i420_video_source.h"
#include "test/util.h"
#include "test/video_source.h"
#include "vpx/vpx_codec.h"
#include "vpx_ports/bitops.h"
namespace {
const size_t kNumFrames = 300;
const int kTemporalId3Layer[4] = { 0, 2, 1, 2 };
const int kTemporalId2Layer[2] = { 0, 1 };
const int kTemporalRateAllocation3Layer[3] = { 50, 70, 100 };
const int kTemporalRateAllocation2Layer[2] = { 60, 100 };
const int kSpatialLayerBitrate[3] = { 200, 400, 1000 };
class RcInterfaceTest
: public ::libvpx_test::EncoderTest,
public ::libvpx_test::CodecTestWith2Params<int, vpx_rc_mode> {
public:
RcInterfaceTest()
: EncoderTest(GET_PARAM(0)), aq_mode_(GET_PARAM(1)), key_interval_(3000),
encoder_exit_(false) {}
virtual ~RcInterfaceTest() {}
protected:
virtual void SetUp() {
InitializeConfig();
SetMode(::libvpx_test::kRealTime);
}
virtual void PreEncodeFrameHook(libvpx_test::VideoSource *video,
libvpx_test::Encoder *encoder) {
if (video->frame() == 0) {
encoder->Control(VP8E_SET_CPUUSED, 7);
encoder->Control(VP9E_SET_AQ_MODE, aq_mode_);
encoder->Control(VP9E_SET_TUNE_CONTENT, 0);
encoder->Control(VP8E_SET_MAX_INTRA_BITRATE_PCT, 1000);
encoder->Control(VP9E_SET_RTC_EXTERNAL_RATECTRL, 1);
}
frame_params_.frame_type =
video->frame() % key_interval_ == 0 ? KEY_FRAME : INTER_FRAME;
if (rc_cfg_.rc_mode == VPX_CBR && frame_params_.frame_type == INTER_FRAME) {
// Disable golden frame update.
frame_flags_ |= VP8_EFLAG_NO_UPD_GF;
frame_flags_ |= VP8_EFLAG_NO_UPD_ARF;
}
encoder_exit_ = video->frame() == kNumFrames;
}
virtual void PostEncodeFrameHook(::libvpx_test::Encoder *encoder) {
if (encoder_exit_) {
return;
}
int loopfilter_level, qp;
encoder->Control(VP9E_GET_LOOPFILTER_LEVEL, &loopfilter_level);
encoder->Control(VP8E_GET_LAST_QUANTIZER, &qp);
rc_api_->ComputeQP(frame_params_);
ASSERT_EQ(rc_api_->GetQP(), qp);
ASSERT_EQ(rc_api_->GetLoopfilterLevel(), loopfilter_level);
}
virtual void FramePktHook(const vpx_codec_cx_pkt_t *pkt) {
rc_api_->PostEncodeUpdate(pkt->data.frame.sz);
}
void RunOneLayer() {
SetConfig(GET_PARAM(2));
rc_api_ = libvpx::VP9RateControlRTC::Create(rc_cfg_);
frame_params_.spatial_layer_id = 0;
frame_params_.temporal_layer_id = 0;
::libvpx_test::I420VideoSource video("desktop_office1.1280_720-020.yuv",
1280, 720, 30, 1, 0, kNumFrames);
ASSERT_NO_FATAL_FAILURE(RunLoop(&video));
}
void RunOneLayerVBRPeriodicKey() {
if (GET_PARAM(2) != VPX_VBR) return;
key_interval_ = 100;
SetConfig(VPX_VBR);
rc_api_ = libvpx::VP9RateControlRTC::Create(rc_cfg_);
frame_params_.spatial_layer_id = 0;
frame_params_.temporal_layer_id = 0;
::libvpx_test::I420VideoSource video("desktop_office1.1280_720-020.yuv",
1280, 720, 30, 1, 0, kNumFrames);
ASSERT_NO_FATAL_FAILURE(RunLoop(&video));
}
private:
void SetConfig(vpx_rc_mode rc_mode) {
rc_cfg_.width = 1280;
rc_cfg_.height = 720;
rc_cfg_.max_quantizer = 52;
rc_cfg_.min_quantizer = 2;
rc_cfg_.target_bandwidth = 1000;
rc_cfg_.buf_initial_sz = 600;
rc_cfg_.buf_optimal_sz = 600;
rc_cfg_.buf_sz = 1000;
rc_cfg_.undershoot_pct = 50;
rc_cfg_.overshoot_pct = 50;
rc_cfg_.max_intra_bitrate_pct = 1000;
rc_cfg_.framerate = 30.0;
rc_cfg_.ss_number_layers = 1;
rc_cfg_.ts_number_layers = 1;
rc_cfg_.scaling_factor_num[0] = 1;
rc_cfg_.scaling_factor_den[0] = 1;
rc_cfg_.layer_target_bitrate[0] = 1000;
rc_cfg_.max_quantizers[0] = 52;
rc_cfg_.min_quantizers[0] = 2;
rc_cfg_.rc_mode = rc_mode;
rc_cfg_.aq_mode = aq_mode_;
// Encoder settings for ground truth.
cfg_.g_w = 1280;
cfg_.g_h = 720;
cfg_.rc_undershoot_pct = 50;
cfg_.rc_overshoot_pct = 50;
cfg_.rc_buf_initial_sz = 600;
cfg_.rc_buf_optimal_sz = 600;
cfg_.rc_buf_sz = 1000;
cfg_.rc_dropframe_thresh = 0;
cfg_.rc_min_quantizer = 2;
cfg_.rc_max_quantizer = 52;
cfg_.rc_end_usage = rc_mode;
cfg_.g_lag_in_frames = 0;
cfg_.g_error_resilient = 0;
cfg_.rc_target_bitrate = 1000;
cfg_.kf_min_dist = key_interval_;
cfg_.kf_max_dist = key_interval_;
}
std::unique_ptr<libvpx::VP9RateControlRTC> rc_api_;
libvpx::VP9RateControlRtcConfig rc_cfg_;
int aq_mode_;
int key_interval_;
libvpx::VP9FrameParamsQpRTC frame_params_;
bool encoder_exit_;
};
class RcInterfaceSvcTest : public ::libvpx_test::EncoderTest,
public ::libvpx_test::CodecTestWithParam<int> {
public:
RcInterfaceSvcTest() : EncoderTest(GET_PARAM(0)), aq_mode_(GET_PARAM(1)) {}
virtual ~RcInterfaceSvcTest() {}
protected:
virtual void SetUp() {
InitializeConfig();
SetMode(::libvpx_test::kRealTime);
}
virtual void PreEncodeFrameHook(libvpx_test::VideoSource *video,
::libvpx_test::Encoder *encoder) {
if (video->frame() == 0) {
encoder->Control(VP8E_SET_CPUUSED, 7);
encoder->Control(VP9E_SET_AQ_MODE, aq_mode_);
encoder->Control(VP9E_SET_TUNE_CONTENT, 0);
encoder->Control(VP8E_SET_MAX_INTRA_BITRATE_PCT, 900);
encoder->Control(VP9E_SET_RTC_EXTERNAL_RATECTRL, 1);
encoder->Control(VP9E_SET_SVC, 1);
encoder->Control(VP9E_SET_SVC_PARAMETERS, &svc_params_);
}
frame_params_.frame_type =
video->frame() % key_interval_ == 0 ? KEY_FRAME : INTER_FRAME;
encoder_exit_ = video->frame() == kNumFrames;
current_superframe_ = video->frame();
if (dynamic_spatial_layers_ == 1) {
if (video->frame() == 100) {
// Go down to 2 spatial layers: set top SL to 0 bitrate.
// Update the encoder config.
cfg_.rc_target_bitrate -= cfg_.layer_target_bitrate[8];
cfg_.layer_target_bitrate[6] = 0;
cfg_.layer_target_bitrate[7] = 0;
cfg_.layer_target_bitrate[8] = 0;
encoder->Config(&cfg_);
// Update the RC config.
rc_cfg_.target_bandwidth -= rc_cfg_.layer_target_bitrate[8];
rc_cfg_.layer_target_bitrate[6] = 0;
rc_cfg_.layer_target_bitrate[7] = 0;
rc_cfg_.layer_target_bitrate[8] = 0;
rc_api_->UpdateRateControl(rc_cfg_);
} else if (video->frame() == 200) {
// Go down to 1 spatial layer.
// Update the encoder config.
cfg_.rc_target_bitrate -= cfg_.layer_target_bitrate[5];
cfg_.layer_target_bitrate[3] = 0;
cfg_.layer_target_bitrate[4] = 0;
cfg_.layer_target_bitrate[5] = 0;
encoder->Config(&cfg_);
// Update the RC config.
rc_cfg_.target_bandwidth -= rc_cfg_.layer_target_bitrate[5];
rc_cfg_.layer_target_bitrate[3] = 0;
rc_cfg_.layer_target_bitrate[4] = 0;
rc_cfg_.layer_target_bitrate[5] = 0;
rc_api_->UpdateRateControl(rc_cfg_);
} else if (0 && video->frame() == 280) {
// TODO(marpan): Re-enable this going back up when issue is fixed.
// Go back up to 3 spatial layers.
// Update the encoder config: use the original bitrates.
SetEncoderConfigSvc(3, 3);
encoder->Config(&cfg_);
// Update the RC config.
SetRCConfigSvc(3, 3);
rc_api_->UpdateRateControl(rc_cfg_);
}
}
}
virtual void PostEncodeFrameHook(::libvpx_test::Encoder *encoder) {
::libvpx_test::CxDataIterator iter = encoder->GetCxData();
for (int sl = 0; sl < rc_cfg_.ss_number_layers; sl++) sizes_[sl] = 0;
while (const vpx_codec_cx_pkt_t *pkt = iter.Next()) {
ParseSuperframeSizes(static_cast<const uint8_t *>(pkt->data.frame.buf),
pkt->data.frame.sz);
for (int sl = 0; sl < rc_cfg_.ss_number_layers; sl++) {
if (sizes_[sl] > 0) {
frame_params_.spatial_layer_id = sl;
if (rc_cfg_.ts_number_layers == 3)
frame_params_.temporal_layer_id =
kTemporalId3Layer[current_superframe_ % 4];
else if (rc_cfg_.ts_number_layers == 2)
frame_params_.temporal_layer_id =
kTemporalId2Layer[current_superframe_ % 2];
else
frame_params_.temporal_layer_id = 0;
rc_api_->ComputeQP(frame_params_);
frame_params_.frame_type = INTER_FRAME;
rc_api_->PostEncodeUpdate(sizes_[sl]);
}
}
}
if (!encoder_exit_) {
int loopfilter_level, qp;
encoder->Control(VP9E_GET_LOOPFILTER_LEVEL, &loopfilter_level);
encoder->Control(VP8E_GET_LAST_QUANTIZER, &qp);
ASSERT_EQ(rc_api_->GetQP(), qp);
ASSERT_EQ(rc_api_->GetLoopfilterLevel(), loopfilter_level);
}
}
// This method needs to be overridden because non-reference frames are
// expected to be mismatched frames as the encoder will avoid loopfilter on
// these frames.
virtual void MismatchHook(const vpx_image_t * /*img1*/,
const vpx_image_t * /*img2*/) {}
void RunSvc() {
dynamic_spatial_layers_ = 0;
SetRCConfigSvc(3, 3);
key_interval_ = 10000;
rc_api_ = libvpx::VP9RateControlRTC::Create(rc_cfg_);
SetEncoderConfigSvc(3, 3);
::libvpx_test::I420VideoSource video("desktop_office1.1280_720-020.yuv",
1280, 720, 30, 1, 0, kNumFrames);
ASSERT_NO_FATAL_FAILURE(RunLoop(&video));
}
void RunSvcPeriodicKey() {
dynamic_spatial_layers_ = 0;
SetRCConfigSvc(3, 3);
key_interval_ = 100;
rc_api_ = libvpx::VP9RateControlRTC::Create(rc_cfg_);
SetEncoderConfigSvc(3, 3);
::libvpx_test::I420VideoSource video("desktop_office1.1280_720-020.yuv",
1280, 720, 30, 1, 0, kNumFrames);
ASSERT_NO_FATAL_FAILURE(RunLoop(&video));
}
void RunSvcDynamicSpatial() {
dynamic_spatial_layers_ = 1;
SetRCConfigSvc(3, 3);
key_interval_ = 10000;
rc_api_ = libvpx::VP9RateControlRTC::Create(rc_cfg_);
SetEncoderConfigSvc(3, 3);
::libvpx_test::I420VideoSource video("desktop_office1.1280_720-020.yuv",
1280, 720, 30, 1, 0, kNumFrames);
ASSERT_NO_FATAL_FAILURE(RunLoop(&video));
}
private:
vpx_codec_err_t ParseSuperframeSizes(const uint8_t *data, size_t data_sz) {
uint8_t marker = *(data + data_sz - 1);
if ((marker & 0xe0) == 0xc0) {
const uint32_t frames = (marker & 0x7) + 1;
const uint32_t mag = ((marker >> 3) & 0x3) + 1;
const size_t index_sz = 2 + mag * frames;
// This chunk is marked as having a superframe index but doesn't have
// enough data for it, thus it's an invalid superframe index.
if (data_sz < index_sz) return VPX_CODEC_CORRUPT_FRAME;
{
const uint8_t marker2 = *(data + data_sz - index_sz);
// This chunk is marked as having a superframe index but doesn't have
// the matching marker byte at the front of the index therefore it's an
// invalid chunk.
if (marker != marker2) return VPX_CODEC_CORRUPT_FRAME;
}
const uint8_t *x = &data[data_sz - index_sz + 1];
for (uint32_t i = 0; i < frames; ++i) {
uint32_t this_sz = 0;
for (uint32_t j = 0; j < mag; ++j) this_sz |= (*x++) << (j * 8);
sizes_[i] = this_sz;
}
}
return VPX_CODEC_OK;
}
void SetEncoderConfigSvc(int number_spatial_layers,
int number_temporal_layers) {
cfg_.g_w = 1280;
cfg_.g_h = 720;
cfg_.ss_number_layers = number_spatial_layers;
cfg_.ts_number_layers = number_temporal_layers;
cfg_.g_timebase.num = 1;
cfg_.g_timebase.den = 30;
if (number_spatial_layers == 3) {
svc_params_.scaling_factor_num[0] = 1;
svc_params_.scaling_factor_den[0] = 4;
svc_params_.scaling_factor_num[1] = 2;
svc_params_.scaling_factor_den[1] = 4;
svc_params_.scaling_factor_num[2] = 4;
svc_params_.scaling_factor_den[2] = 4;
} else if (number_spatial_layers == 2) {
svc_params_.scaling_factor_num[0] = 1;
svc_params_.scaling_factor_den[0] = 2;
svc_params_.scaling_factor_num[1] = 2;
svc_params_.scaling_factor_den[1] = 2;
} else if (number_spatial_layers == 1) {
svc_params_.scaling_factor_num[0] = 1;
svc_params_.scaling_factor_den[0] = 1;
}
for (int i = 0; i < VPX_MAX_LAYERS; ++i) {
svc_params_.max_quantizers[i] = 56;
svc_params_.min_quantizers[i] = 2;
svc_params_.speed_per_layer[i] = 7;
svc_params_.loopfilter_ctrl[i] = LOOPFILTER_ALL;
}
cfg_.rc_end_usage = VPX_CBR;
cfg_.g_lag_in_frames = 0;
cfg_.g_error_resilient = 0;
if (number_temporal_layers == 3) {
cfg_.ts_rate_decimator[0] = 4;
cfg_.ts_rate_decimator[1] = 2;
cfg_.ts_rate_decimator[2] = 1;
cfg_.temporal_layering_mode = 3;
} else if (number_temporal_layers == 2) {
cfg_.ts_rate_decimator[0] = 2;
cfg_.ts_rate_decimator[1] = 1;
cfg_.temporal_layering_mode = 2;
} else if (number_temporal_layers == 1) {
cfg_.ts_rate_decimator[0] = 1;
cfg_.temporal_layering_mode = 0;
}
cfg_.rc_buf_initial_sz = 500;
cfg_.rc_buf_optimal_sz = 600;
cfg_.rc_buf_sz = 1000;
cfg_.rc_min_quantizer = 2;
cfg_.rc_max_quantizer = 56;
cfg_.g_threads = 1;
cfg_.kf_max_dist = 9999;
cfg_.rc_overshoot_pct = 50;
cfg_.rc_undershoot_pct = 50;
cfg_.rc_target_bitrate = 0;
for (int sl = 0; sl < number_spatial_layers; sl++) {
int spatial_bitrate = 0;
if (number_spatial_layers <= 3)
spatial_bitrate = kSpatialLayerBitrate[sl];
for (int tl = 0; tl < number_temporal_layers; tl++) {
int layer = sl * number_temporal_layers + tl;
if (number_temporal_layers == 3)
cfg_.layer_target_bitrate[layer] =
kTemporalRateAllocation3Layer[tl] * spatial_bitrate / 100;
else if (number_temporal_layers == 2)
cfg_.layer_target_bitrate[layer] =
kTemporalRateAllocation2Layer[tl] * spatial_bitrate / 100;
else if (number_temporal_layers == 1)
cfg_.layer_target_bitrate[layer] = spatial_bitrate;
}
cfg_.rc_target_bitrate += spatial_bitrate;
}
cfg_.kf_min_dist = key_interval_;
cfg_.kf_max_dist = key_interval_;
}
void SetRCConfigSvc(int number_spatial_layers, int number_temporal_layers) {
rc_cfg_.width = 1280;
rc_cfg_.height = 720;
rc_cfg_.ss_number_layers = number_spatial_layers;
rc_cfg_.ts_number_layers = number_temporal_layers;
rc_cfg_.max_quantizer = 56;
rc_cfg_.min_quantizer = 2;
rc_cfg_.buf_initial_sz = 500;
rc_cfg_.buf_optimal_sz = 600;
rc_cfg_.buf_sz = 1000;
rc_cfg_.undershoot_pct = 50;
rc_cfg_.overshoot_pct = 50;
rc_cfg_.max_intra_bitrate_pct = 900;
rc_cfg_.framerate = 30.0;
rc_cfg_.rc_mode = VPX_CBR;
rc_cfg_.aq_mode = aq_mode_;
if (number_spatial_layers == 3) {
rc_cfg_.scaling_factor_num[0] = 1;
rc_cfg_.scaling_factor_den[0] = 4;
rc_cfg_.scaling_factor_num[1] = 2;
rc_cfg_.scaling_factor_den[1] = 4;
rc_cfg_.scaling_factor_num[2] = 4;
rc_cfg_.scaling_factor_den[2] = 4;
} else if (number_spatial_layers == 2) {
rc_cfg_.scaling_factor_num[0] = 1;
rc_cfg_.scaling_factor_den[0] = 2;
rc_cfg_.scaling_factor_num[1] = 2;
rc_cfg_.scaling_factor_den[1] = 2;
} else if (number_spatial_layers == 1) {
rc_cfg_.scaling_factor_num[0] = 1;
rc_cfg_.scaling_factor_den[0] = 1;
}
if (number_temporal_layers == 3) {
rc_cfg_.ts_rate_decimator[0] = 4;
rc_cfg_.ts_rate_decimator[1] = 2;
rc_cfg_.ts_rate_decimator[2] = 1;
} else if (number_temporal_layers == 2) {
rc_cfg_.ts_rate_decimator[0] = 2;
rc_cfg_.ts_rate_decimator[1] = 1;
} else if (number_temporal_layers == 1) {
rc_cfg_.ts_rate_decimator[0] = 1;
}
rc_cfg_.target_bandwidth = 0;
for (int sl = 0; sl < number_spatial_layers; sl++) {
int spatial_bitrate = 0;
if (number_spatial_layers <= 3)
spatial_bitrate = kSpatialLayerBitrate[sl];
for (int tl = 0; tl < number_temporal_layers; tl++) {
int layer = sl * number_temporal_layers + tl;
if (number_temporal_layers == 3)
rc_cfg_.layer_target_bitrate[layer] =
kTemporalRateAllocation3Layer[tl] * spatial_bitrate / 100;
else if (number_temporal_layers == 2)
rc_cfg_.layer_target_bitrate[layer] =
kTemporalRateAllocation2Layer[tl] * spatial_bitrate / 100;
else if (number_temporal_layers == 1)
rc_cfg_.layer_target_bitrate[layer] = spatial_bitrate;
}
rc_cfg_.target_bandwidth += spatial_bitrate;
}
for (int sl = 0; sl < rc_cfg_.ss_number_layers; ++sl) {
for (int tl = 0; tl < rc_cfg_.ts_number_layers; ++tl) {
const int i = sl * rc_cfg_.ts_number_layers + tl;
rc_cfg_.max_quantizers[i] = 56;
rc_cfg_.min_quantizers[i] = 2;
}
}
}
int aq_mode_;
std::unique_ptr<libvpx::VP9RateControlRTC> rc_api_;
libvpx::VP9RateControlRtcConfig rc_cfg_;
vpx_svc_extra_cfg_t svc_params_;
libvpx::VP9FrameParamsQpRTC frame_params_;
bool encoder_exit_;
int current_superframe_;
uint32_t sizes_[8];
int key_interval_;
int dynamic_spatial_layers_;
};
TEST_P(RcInterfaceTest, OneLayer) { RunOneLayer(); }
TEST_P(RcInterfaceTest, OneLayerVBRPeriodicKey) { RunOneLayerVBRPeriodicKey(); }
TEST_P(RcInterfaceSvcTest, Svc) { RunSvc(); }
TEST_P(RcInterfaceSvcTest, SvcPeriodicKey) { RunSvcPeriodicKey(); }
TEST_P(RcInterfaceSvcTest, SvcDynamicSpatial) { RunSvcDynamicSpatial(); }
VP9_INSTANTIATE_TEST_SUITE(RcInterfaceTest, ::testing::Values(0, 3),
::testing::Values(VPX_CBR, VPX_VBR));
VP9_INSTANTIATE_TEST_SUITE(RcInterfaceSvcTest, ::testing::Values(0, 3));
} // namespace