303 lines
12 KiB
C++
303 lines
12 KiB
C++
/*
|
|
* Copyright (c) 2017 The WebM project authors. All Rights Reserved.
|
|
* Copyright (c) 2024, Alliance for Open Media. All rights reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include <assert.h>
|
|
#include <string.h>
|
|
|
|
#include <tuple>
|
|
|
|
#include "gtest/gtest.h"
|
|
|
|
#include "common/av1_config.h"
|
|
#include "config/av1_rtcd.h"
|
|
|
|
#include "config/aom_config.h"
|
|
#include "config/aom_dsp_rtcd.h"
|
|
|
|
#include "aom_dsp/aom_dsp_common.h"
|
|
#include "aom_dsp/aom_filter.h"
|
|
#include "aom_mem/aom_mem.h"
|
|
#include "aom_ports/aom_timer.h"
|
|
#include "aom_ports/mem.h"
|
|
#include "av1/common/filter.h"
|
|
#include "test/acm_random.h"
|
|
#include "test/register_state_check.h"
|
|
#include "test/util.h"
|
|
|
|
namespace {
|
|
|
|
using ResizeFrameFunc = void (*)(const YV12_BUFFER_CONFIG *src,
|
|
YV12_BUFFER_CONFIG *dst,
|
|
const InterpFilter filter, const int phase,
|
|
const int num_planes);
|
|
|
|
class ResizeAndExtendTest : public ::testing::TestWithParam<ResizeFrameFunc> {
|
|
public:
|
|
ResizeAndExtendTest() { resize_fn_ = GetParam(); }
|
|
~ResizeAndExtendTest() override = default;
|
|
|
|
protected:
|
|
const int kBufFiller = 123;
|
|
const int kBufMax = kBufFiller - 1;
|
|
|
|
void FillPlane(uint8_t *const buf, const int width, const int height,
|
|
const int stride) {
|
|
for (int y = 0; y < height; ++y) {
|
|
for (int x = 0; x < width; ++x) {
|
|
buf[x + (y * stride)] = (x + (width * y)) % kBufMax;
|
|
}
|
|
}
|
|
}
|
|
|
|
void ResetResizeImage(YV12_BUFFER_CONFIG *const img, const int width,
|
|
const int height, const int border) {
|
|
memset(img, 0, sizeof(*img));
|
|
ASSERT_EQ(0, aom_alloc_frame_buffer(img, width, height, 1, 1, 0, border, 16,
|
|
false, 0));
|
|
memset(img->buffer_alloc, kBufFiller, img->frame_size);
|
|
}
|
|
|
|
void ResetResizeImages(const int src_width, const int src_height,
|
|
const int dst_width, const int dst_height,
|
|
const int dst_border) {
|
|
ResetResizeImage(&img_, src_width, src_height, AOM_BORDER_IN_PIXELS);
|
|
ResetResizeImage(&ref_img_, dst_width, dst_height, dst_border);
|
|
ResetResizeImage(&dst_img_, dst_width, dst_height, dst_border);
|
|
FillPlane(img_.y_buffer, img_.y_crop_width, img_.y_crop_height,
|
|
img_.y_stride);
|
|
FillPlane(img_.u_buffer, img_.uv_crop_width, img_.uv_crop_height,
|
|
img_.uv_stride);
|
|
FillPlane(img_.v_buffer, img_.uv_crop_width, img_.uv_crop_height,
|
|
img_.uv_stride);
|
|
}
|
|
|
|
void DeallocResizeImages() {
|
|
aom_free_frame_buffer(&img_);
|
|
aom_free_frame_buffer(&ref_img_);
|
|
aom_free_frame_buffer(&dst_img_);
|
|
}
|
|
|
|
void RunTest(InterpFilter filter_type) {
|
|
static const int kNumSizesToTest = 22;
|
|
static const int kNumScaleFactorsToTest = 4;
|
|
static const int kNumDstBordersToTest = 2;
|
|
static const int kSizesToTest[] = { 1, 2, 3, 4, 6, 8, 10, 12,
|
|
14, 16, 18, 20, 22, 24, 26, 28,
|
|
30, 32, 34, 68, 128, 134 };
|
|
static const int kScaleFactors[] = { 1, 2, 3, 4 };
|
|
static const int kDstBorders[] = { 0, AOM_BORDER_IN_PIXELS };
|
|
for (int border = 0; border < kNumDstBordersToTest; ++border) {
|
|
const int dst_border = kDstBorders[border];
|
|
for (int phase_scaler = 0; phase_scaler < 16; ++phase_scaler) {
|
|
for (int h = 0; h < kNumSizesToTest; ++h) {
|
|
const int src_height = kSizesToTest[h];
|
|
for (int w = 0; w < kNumSizesToTest; ++w) {
|
|
const int src_width = kSizesToTest[w];
|
|
for (int sf_up_idx = 0; sf_up_idx < kNumScaleFactorsToTest;
|
|
++sf_up_idx) {
|
|
const int sf_up = kScaleFactors[sf_up_idx];
|
|
for (int sf_down_idx = 0; sf_down_idx < kNumScaleFactorsToTest;
|
|
++sf_down_idx) {
|
|
const int sf_down = kScaleFactors[sf_down_idx];
|
|
const int dst_width = src_width * sf_up / sf_down;
|
|
const int dst_height = src_height * sf_up / sf_down;
|
|
// TODO: bug aomedia:363916152 - Enable unit tests for 4 to 3
|
|
// scaling when Neon and SSSE3 implementation of
|
|
// av1_resize_and_extend_frame do not differ from scalar version
|
|
if (sf_down == 4 && sf_up == 3) {
|
|
continue;
|
|
}
|
|
|
|
if (sf_up == sf_down && sf_up != 1) {
|
|
continue;
|
|
}
|
|
// I420 frame width and height must be even.
|
|
if (!dst_width || !dst_height || dst_width & 1 ||
|
|
dst_height & 1) {
|
|
continue;
|
|
}
|
|
// aom_convolve8_c() has restriction on the step which cannot
|
|
// exceed 64 (ratio 1 to 4).
|
|
if (src_width > 4 * dst_width || src_height > 4 * dst_height) {
|
|
continue;
|
|
}
|
|
ASSERT_NO_FATAL_FAILURE(ResetResizeImages(
|
|
src_width, src_height, dst_width, dst_height, dst_border));
|
|
|
|
av1_resize_and_extend_frame_c(&img_, &ref_img_, filter_type,
|
|
phase_scaler, 1);
|
|
resize_fn_(&img_, &dst_img_, filter_type, phase_scaler, 1);
|
|
|
|
if (memcmp(dst_img_.buffer_alloc, ref_img_.buffer_alloc,
|
|
ref_img_.frame_size)) {
|
|
printf(
|
|
"filter_type = %d, phase_scaler = %d, src_width = %4d, "
|
|
"src_height = %4d, dst_width = %4d, dst_height = %4d, "
|
|
"scale factor = %d:%d\n",
|
|
filter_type, phase_scaler, src_width, src_height,
|
|
dst_width, dst_height, sf_down, sf_up);
|
|
PrintDiff();
|
|
}
|
|
|
|
EXPECT_EQ(ref_img_.frame_size, dst_img_.frame_size);
|
|
EXPECT_EQ(0,
|
|
memcmp(ref_img_.buffer_alloc, dst_img_.buffer_alloc,
|
|
ref_img_.frame_size));
|
|
|
|
DeallocResizeImages();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void PrintDiffComponent(const uint8_t *const ref, const uint8_t *const opt,
|
|
const int stride, const int width, const int height,
|
|
const int plane_idx) const {
|
|
for (int y = 0; y < height; y++) {
|
|
for (int x = 0; x < width; x++) {
|
|
if (ref[y * stride + x] != opt[y * stride + x]) {
|
|
printf("Plane %d pixel[%d][%d] diff:%6d (ref),%6d (opt)\n", plane_idx,
|
|
y, x, ref[y * stride + x], opt[y * stride + x]);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void PrintDiff() const {
|
|
assert(ref_img_.y_stride == dst_img_.y_stride);
|
|
assert(ref_img_.y_width == dst_img_.y_width);
|
|
assert(ref_img_.y_height == dst_img_.y_height);
|
|
assert(ref_img_.uv_stride == dst_img_.uv_stride);
|
|
assert(ref_img_.uv_width == dst_img_.uv_width);
|
|
assert(ref_img_.uv_height == dst_img_.uv_height);
|
|
|
|
if (memcmp(dst_img_.buffer_alloc, ref_img_.buffer_alloc,
|
|
ref_img_.frame_size)) {
|
|
PrintDiffComponent(ref_img_.y_buffer, dst_img_.y_buffer,
|
|
ref_img_.y_stride, ref_img_.y_width, ref_img_.y_height,
|
|
0);
|
|
PrintDiffComponent(ref_img_.u_buffer, dst_img_.u_buffer,
|
|
ref_img_.uv_stride, ref_img_.uv_width,
|
|
ref_img_.uv_height, 1);
|
|
PrintDiffComponent(ref_img_.v_buffer, dst_img_.v_buffer,
|
|
ref_img_.uv_stride, ref_img_.uv_width,
|
|
ref_img_.uv_height, 2);
|
|
}
|
|
}
|
|
|
|
void SpeedTest() {
|
|
static const int kCountSpeedTestBlock = 100;
|
|
static const int kNumScaleFactorsToTest = 4;
|
|
static const int kNumInterpFiltersToTest = 3;
|
|
static const int kScaleFactors[] = { 1, 2, 3, 4 };
|
|
static const int kInterpFilters[] = { 0, 1, 3 };
|
|
const int src_width = 1280;
|
|
const int src_height = 720;
|
|
for (int filter = 0; filter < kNumInterpFiltersToTest; ++filter) {
|
|
const InterpFilter filter_type =
|
|
static_cast<InterpFilter>(kInterpFilters[filter]);
|
|
for (int phase_scaler = 0; phase_scaler < 2; ++phase_scaler) {
|
|
for (int sf_up_idx = 0; sf_up_idx < kNumScaleFactorsToTest;
|
|
++sf_up_idx) {
|
|
const int sf_up = kScaleFactors[sf_up_idx];
|
|
for (int sf_down_idx = 0; sf_down_idx < kNumScaleFactorsToTest;
|
|
++sf_down_idx) {
|
|
const int sf_down = kScaleFactors[sf_down_idx];
|
|
const int dst_width = src_width * sf_up / sf_down;
|
|
const int dst_height = src_height * sf_up / sf_down;
|
|
// TODO: bug aomedia:363916152 - Enable unit tests for 4 to 3
|
|
// scaling when Neon and SSSE3 implementation of
|
|
// av1_resize_and_extend_frame do not differ from scalar version
|
|
if (sf_down == 4 && sf_up == 3) {
|
|
continue;
|
|
}
|
|
|
|
if (sf_up == sf_down && sf_up != 1) {
|
|
continue;
|
|
}
|
|
// I420 frame width and height must be even.
|
|
if (dst_width & 1 || dst_height & 1) {
|
|
continue;
|
|
}
|
|
ASSERT_NO_FATAL_FAILURE(ResetResizeImages(src_width, src_height,
|
|
dst_width, dst_height,
|
|
AOM_BORDER_IN_PIXELS));
|
|
|
|
aom_usec_timer ref_timer;
|
|
aom_usec_timer_start(&ref_timer);
|
|
for (int i = 0; i < kCountSpeedTestBlock; ++i)
|
|
av1_resize_and_extend_frame_c(&img_, &ref_img_, filter_type,
|
|
phase_scaler, 1);
|
|
aom_usec_timer_mark(&ref_timer);
|
|
const int64_t ref_time = aom_usec_timer_elapsed(&ref_timer);
|
|
|
|
aom_usec_timer tst_timer;
|
|
aom_usec_timer_start(&tst_timer);
|
|
for (int i = 0; i < kCountSpeedTestBlock; ++i)
|
|
resize_fn_(&img_, &dst_img_, filter_type, phase_scaler, 1);
|
|
aom_usec_timer_mark(&tst_timer);
|
|
const int64_t tst_time = aom_usec_timer_elapsed(&tst_timer);
|
|
DeallocResizeImages();
|
|
|
|
std::cout << "[ ] C time = " << ref_time / 1000
|
|
<< " ms, SIMD time = " << tst_time / 1000 << " ms\n";
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
YV12_BUFFER_CONFIG img_;
|
|
YV12_BUFFER_CONFIG ref_img_;
|
|
YV12_BUFFER_CONFIG dst_img_;
|
|
ResizeFrameFunc resize_fn_;
|
|
};
|
|
|
|
GTEST_ALLOW_UNINSTANTIATED_PARAMETERIZED_TEST(ResizeAndExtendTest);
|
|
|
|
TEST_P(ResizeAndExtendTest, ResizeFrame_EightTap) { RunTest(EIGHTTAP_REGULAR); }
|
|
TEST_P(ResizeAndExtendTest, ResizeFrame_EightTapSmooth) {
|
|
RunTest(EIGHTTAP_SMOOTH);
|
|
}
|
|
TEST_P(ResizeAndExtendTest, ResizeFrame_Bilinear) { RunTest(BILINEAR); }
|
|
TEST_P(ResizeAndExtendTest, DISABLED_Speed) { SpeedTest(); }
|
|
|
|
// TODO: bug aomedia:363916152 - Enable SSSE3 unit tests when implementation of
|
|
// av1_resize_and_extend_frame does not differ from scalar version
|
|
#if HAVE_SSSE3
|
|
INSTANTIATE_TEST_SUITE_P(DISABLED_SSSE3, ResizeAndExtendTest,
|
|
::testing::Values(av1_resize_and_extend_frame_ssse3));
|
|
#endif // HAVE_SSSE3
|
|
|
|
#if HAVE_NEON
|
|
INSTANTIATE_TEST_SUITE_P(NEON, ResizeAndExtendTest,
|
|
::testing::Values(av1_resize_and_extend_frame_neon));
|
|
#endif // HAVE_NEON
|
|
|
|
#if HAVE_NEON_DOTPROD
|
|
INSTANTIATE_TEST_SUITE_P(
|
|
NEON_DOTPROD, ResizeAndExtendTest,
|
|
::testing::Values(av1_resize_and_extend_frame_neon_dotprod));
|
|
|
|
#endif // HAVE_NEON_DOTPROD
|
|
|
|
#if HAVE_NEON_I8MM
|
|
INSTANTIATE_TEST_SUITE_P(
|
|
NEON_I8MM, ResizeAndExtendTest,
|
|
::testing::Values(av1_resize_and_extend_frame_neon_i8mm));
|
|
|
|
#endif // HAVE_NEON_I8MM
|
|
|
|
} // namespace
|