// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "base/base_paths.h"
#include "base/cpu.h"
#include "base/file_util.h"
#include "base/logging.h"
#include "base/path_service.h"
#include "base/time/time.h"
#include "media/base/simd/convert_yuv_to_rgb.h"
#include "media/base/yuv_convert.h"
#include "testing/gtest/include/gtest/gtest.h"
#include "testing/perf/perf_test.h"
namespace media {
#if !defined(ARCH_CPU_ARM_FAMILY) && !defined(ARCH_CPU_MIPS_FAMILY)
// Size of raw image.
static const int kSourceWidth = 640;
static const int kSourceHeight = 360;
static const int kSourceYSize = kSourceWidth * kSourceHeight;
static const int kSourceUOffset = kSourceYSize;
static const int kSourceVOffset = kSourceYSize * 5 / 4;
static const int kBpp = 4;
// Width of the row to convert. Odd so that we exercise the ending
// one-pixel-leftover case.
static const int kWidth = 639;
// Surface sizes for various test files.
static const int kYUV12Size = kSourceYSize * 12 / 8;
static const int kRGBSize = kSourceYSize * kBpp;
static const int kPerfTestIterations = 2000;
class YUVConvertPerfTest : public testing::Test {
public:
YUVConvertPerfTest()
: yuv_bytes_(new uint8[kYUV12Size]),
rgb_bytes_converted_(new uint8[kRGBSize]) {
base::FilePath path;
CHECK(PathService::Get(base::DIR_SOURCE_ROOT, &path));
path = path.Append(FILE_PATH_LITERAL("media"))
.Append(FILE_PATH_LITERAL("test"))
.Append(FILE_PATH_LITERAL("data"))
.Append(FILE_PATH_LITERAL("bali_640x360_P420.yuv"));
// Verify file size is correct.
int64 actual_size = 0;
base::GetFileSize(path, &actual_size);
CHECK_EQ(actual_size, kYUV12Size);
// Verify bytes read are correct.
int bytes_read = base::ReadFile(
path, reinterpret_cast<char*>(yuv_bytes_.get()), kYUV12Size);
CHECK_EQ(bytes_read, kYUV12Size);
}
scoped_ptr<uint8[]> yuv_bytes_;
scoped_ptr<uint8[]> rgb_bytes_converted_;
private:
DISALLOW_COPY_AND_ASSIGN(YUVConvertPerfTest);
};
TEST_F(YUVConvertPerfTest, ConvertYUVToRGB32Row_MMX) {
ASSERT_TRUE(base::CPU().has_mmx());
base::TimeTicks start = base::TimeTicks::HighResNow();
for (int i = 0; i < kPerfTestIterations; ++i) {
for (int row = 0; row < kSourceHeight; ++row) {
int chroma_row = row / 2;
ConvertYUVToRGB32Row_MMX(
yuv_bytes_.get() + row * kSourceWidth,
yuv_bytes_.get() + kSourceUOffset + (chroma_row * kSourceWidth / 2),
yuv_bytes_.get() + kSourceVOffset + (chroma_row * kSourceWidth / 2),
rgb_bytes_converted_.get(),
kWidth,
GetLookupTable(YV12));
}
}
double total_time_seconds =
(base::TimeTicks::HighResNow() - start).InSecondsF();
perf_test::PrintResult(
"yuv_convert_perftest", "", "ConvertYUVToRGB32Row_MMX",
kPerfTestIterations / total_time_seconds, "runs/s", true);
media::EmptyRegisterState();
}
TEST_F(YUVConvertPerfTest, ConvertYUVToRGB32Row_SSE) {
ASSERT_TRUE(base::CPU().has_sse());
base::TimeTicks start = base::TimeTicks::HighResNow();
for (int i = 0; i < kPerfTestIterations; ++i) {
for (int row = 0; row < kSourceHeight; ++row) {
int chroma_row = row / 2;
ConvertYUVToRGB32Row_SSE(
yuv_bytes_.get() + row * kSourceWidth,
yuv_bytes_.get() + kSourceUOffset + (chroma_row * kSourceWidth / 2),
yuv_bytes_.get() + kSourceVOffset + (chroma_row * kSourceWidth / 2),
rgb_bytes_converted_.get(),
kWidth,
GetLookupTable(YV12));
}
}
double total_time_seconds =
(base::TimeTicks::HighResNow() - start).InSecondsF();
perf_test::PrintResult(
"yuv_convert_perftest", "", "ConvertYUVToRGB32Row_SSE",
kPerfTestIterations / total_time_seconds, "runs/s", true);
media::EmptyRegisterState();
}
TEST_F(YUVConvertPerfTest, ScaleYUVToRGB32Row_MMX) {
ASSERT_TRUE(base::CPU().has_mmx());
const int kSourceDx = 80000; // This value means a scale down.
base::TimeTicks start = base::TimeTicks::HighResNow();
for (int i = 0; i < kPerfTestIterations; ++i) {
for (int row = 0; row < kSourceHeight; ++row) {
int chroma_row = row / 2;
ScaleYUVToRGB32Row_MMX(
yuv_bytes_.get() + row * kSourceWidth,
yuv_bytes_.get() + kSourceUOffset + (chroma_row * kSourceWidth / 2),
yuv_bytes_.get() + kSourceVOffset + (chroma_row * kSourceWidth / 2),
rgb_bytes_converted_.get(),
kWidth,
kSourceDx,
GetLookupTable(YV12));
}
}
double total_time_seconds =
(base::TimeTicks::HighResNow() - start).InSecondsF();
perf_test::PrintResult(
"yuv_convert_perftest", "", "ScaleYUVToRGB32Row_MMX",
kPerfTestIterations / total_time_seconds, "runs/s", true);
media::EmptyRegisterState();
}
TEST_F(YUVConvertPerfTest, ScaleYUVToRGB32Row_SSE) {
ASSERT_TRUE(base::CPU().has_sse());
const int kSourceDx = 80000; // This value means a scale down.
base::TimeTicks start = base::TimeTicks::HighResNow();
for (int i = 0; i < kPerfTestIterations; ++i) {
for (int row = 0; row < kSourceHeight; ++row) {
int chroma_row = row / 2;
ScaleYUVToRGB32Row_SSE(
yuv_bytes_.get() + row * kSourceWidth,
yuv_bytes_.get() + kSourceUOffset + (chroma_row * kSourceWidth / 2),
yuv_bytes_.get() + kSourceVOffset + (chroma_row * kSourceWidth / 2),
rgb_bytes_converted_.get(),
kWidth,
kSourceDx,
GetLookupTable(YV12));
}
}
double total_time_seconds =
(base::TimeTicks::HighResNow() - start).InSecondsF();
perf_test::PrintResult(
"yuv_convert_perftest", "", "ScaleYUVToRGB32Row_SSE",
kPerfTestIterations / total_time_seconds, "runs/s", true);
media::EmptyRegisterState();
}
TEST_F(YUVConvertPerfTest, LinearScaleYUVToRGB32Row_MMX) {
ASSERT_TRUE(base::CPU().has_mmx());
const int kSourceDx = 80000; // This value means a scale down.
base::TimeTicks start = base::TimeTicks::HighResNow();
for (int i = 0; i < kPerfTestIterations; ++i) {
for (int row = 0; row < kSourceHeight; ++row) {
int chroma_row = row / 2;
LinearScaleYUVToRGB32Row_MMX(
yuv_bytes_.get() + row * kSourceWidth,
yuv_bytes_.get() + kSourceUOffset + (chroma_row * kSourceWidth / 2),
yuv_bytes_.get() + kSourceVOffset + (chroma_row * kSourceWidth / 2),
rgb_bytes_converted_.get(),
kWidth,
kSourceDx,
GetLookupTable(YV12));
}
}
double total_time_seconds =
(base::TimeTicks::HighResNow() - start).InSecondsF();
perf_test::PrintResult(
"yuv_convert_perftest", "", "LinearScaleYUVToRGB32Row_MMX",
kPerfTestIterations / total_time_seconds, "runs/s", true);
media::EmptyRegisterState();
}
TEST_F(YUVConvertPerfTest, LinearScaleYUVToRGB32Row_SSE) {
ASSERT_TRUE(base::CPU().has_sse());
const int kSourceDx = 80000; // This value means a scale down.
base::TimeTicks start = base::TimeTicks::HighResNow();
for (int i = 0; i < kPerfTestIterations; ++i) {
for (int row = 0; row < kSourceHeight; ++row) {
int chroma_row = row / 2;
LinearScaleYUVToRGB32Row_SSE(
yuv_bytes_.get() + row * kSourceWidth,
yuv_bytes_.get() + kSourceUOffset + (chroma_row * kSourceWidth / 2),
yuv_bytes_.get() + kSourceVOffset + (chroma_row * kSourceWidth / 2),
rgb_bytes_converted_.get(),
kWidth,
kSourceDx,
GetLookupTable(YV12));
}
}
double total_time_seconds =
(base::TimeTicks::HighResNow() - start).InSecondsF();
perf_test::PrintResult(
"yuv_convert_perftest", "", "LinearScaleYUVToRGB32Row_SSE",
kPerfTestIterations / total_time_seconds, "runs/s", true);
media::EmptyRegisterState();
}
#endif // !defined(ARCH_CPU_ARM_FAMILY) && !defined(ARCH_CPU_MIPS_FAMILY)
} // namespace media