libbpg/x265/source/test/testbench.cpp

247 lines
7.6 KiB
C++
Raw Normal View History

2015-10-27 10:46:00 +00:00
/*****************************************************************************
* Copyright (C) 2013 x265 project
*
* Authors: Gopu Govindaswamy <gopu@govindaswamy.org>
* Mandar Gurav <mandar@multicorewareinc.com>
* Mahesh Pittala <mahesh@multicorewareinc.com>
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA.
*
* This program is also available under a commercial proprietary license.
* For more information, contact us at license @ x265.com.
*****************************************************************************/
#include "common.h"
#include "primitives.h"
#include "pixelharness.h"
#include "mbdstharness.h"
#include "ipfilterharness.h"
#include "intrapredharness.h"
#include "param.h"
#include "cpu.h"
using namespace X265_NS;
const char* lumaPartStr[NUM_PU_SIZES] =
{
" 4x4", " 8x8", "16x16", "32x32", "64x64",
" 8x4", " 4x8",
" 16x8", " 8x16",
"32x16", "16x32",
"64x32", "32x64",
"16x12", "12x16", " 16x4", " 4x16",
"32x24", "24x32", " 32x8", " 8x32",
"64x48", "48x64", "64x16", "16x64",
};
const char* chromaPartStr420[NUM_PU_SIZES] =
{
" 2x2", " 4x4", " 8x8", "16x16", "32x32",
" 4x2", " 2x4",
" 8x4", " 4x8",
" 16x8", " 8x16",
"32x16", "16x32",
" 8x6", " 6x8", " 8x2", " 2x8",
"16x12", "12x16", " 16x4", " 4x16",
"32x24", "24x32", " 32x8", " 8x32",
};
const char* chromaPartStr422[NUM_PU_SIZES] =
{
" 2x4", " 4x8", " 8x16", "16x32", "32x64",
" 4x4", " 2x8",
" 8x8", " 4x16",
"16x16", " 8x32",
"32x32", "16x64",
" 8x12", " 6x16", " 8x4", " 2x16",
"16x24", "12x32", " 16x8", " 4x32",
"32x48", "24x64", "32x16", " 8x64",
};
const char* const* chromaPartStr[X265_CSP_COUNT] =
{
lumaPartStr,
chromaPartStr420,
chromaPartStr422,
lumaPartStr
};
void do_help()
{
printf("x265 optimized primitive testbench\n\n");
printf("usage: TestBench [--cpuid CPU] [--testbench BENCH] [--help]\n\n");
printf(" CPU is comma separated SIMD arch list, example: SSE4,AVX\n");
printf(" BENCH is one of (pixel,transforms,interp,intrapred)\n\n");
printf("By default, the test bench will test all benches on detected CPU architectures\n");
printf("Options and testbench name may be truncated.\n");
}
PixelHarness HPixel;
MBDstHarness HMBDist;
IPFilterHarness HIPFilter;
IntraPredHarness HIPred;
int main(int argc, char *argv[])
{
int cpuid = X265_NS::cpu_detect();
const char *testname = 0;
if (!(argc & 1))
{
do_help();
return 0;
}
for (int i = 1; i < argc - 1; i += 2)
{
if (strncmp(argv[i], "--", 2))
{
printf("** invalid long argument: %s\n\n", argv[i]);
do_help();
return 1;
}
const char *name = argv[i] + 2;
const char *value = argv[i + 1];
if (!strncmp(name, "cpuid", strlen(name)))
{
bool bError = false;
cpuid = parseCpuName(value, bError);
if (bError)
{
printf("Invalid CPU name: %s\n", value);
return 1;
}
}
else if (!strncmp(name, "testbench", strlen(name)))
{
testname = value;
printf("Testing only harnesses that match name <%s>\n", testname);
}
else
{
printf("** invalid long argument: %s\n\n", name);
do_help();
return 1;
}
}
int seed = (int)time(NULL);
printf("Using random seed %X %dbit\n", seed, X265_DEPTH);
srand(seed);
// To disable classes of tests, simply comment them out in this list
TestHarness *harness[] =
{
&HPixel,
&HMBDist,
&HIPFilter,
&HIPred
};
EncoderPrimitives cprim;
memset(&cprim, 0, sizeof(EncoderPrimitives));
setupCPrimitives(cprim);
setupAliasPrimitives(cprim);
struct test_arch_t
{
char name[12];
int flag;
} test_arch[] =
{
{ "SSE2", X265_CPU_SSE2 },
{ "SSE3", X265_CPU_SSE3 },
{ "SSSE3", X265_CPU_SSSE3 },
{ "SSE4", X265_CPU_SSE4 },
{ "AVX", X265_CPU_AVX },
{ "XOP", X265_CPU_XOP },
{ "AVX2", X265_CPU_AVX2 },
{ "BMI2", X265_CPU_AVX2 | X265_CPU_BMI1 | X265_CPU_BMI2 },
{ "", 0 },
};
for (int i = 0; test_arch[i].flag; i++)
{
if ((test_arch[i].flag & cpuid) == test_arch[i].flag)
{
printf("Testing primitives: %s\n", test_arch[i].name);
fflush(stdout);
}
else
continue;
EncoderPrimitives vecprim;
memset(&vecprim, 0, sizeof(vecprim));
setupInstrinsicPrimitives(vecprim, test_arch[i].flag);
setupAliasPrimitives(vecprim);
for (size_t h = 0; h < sizeof(harness) / sizeof(TestHarness*); h++)
{
if (testname && strncmp(testname, harness[h]->getName(), strlen(testname)))
continue;
if (!harness[h]->testCorrectness(cprim, vecprim))
{
fflush(stdout);
fprintf(stderr, "\nx265: intrinsic primitive has failed. Go and fix that Right Now!\n");
return -1;
}
}
EncoderPrimitives asmprim;
memset(&asmprim, 0, sizeof(asmprim));
setupAssemblyPrimitives(asmprim, test_arch[i].flag);
setupAliasPrimitives(asmprim);
memcpy(&primitives, &asmprim, sizeof(EncoderPrimitives));
for (size_t h = 0; h < sizeof(harness) / sizeof(TestHarness*); h++)
{
if (testname && strncmp(testname, harness[h]->getName(), strlen(testname)))
continue;
if (!harness[h]->testCorrectness(cprim, asmprim))
{
fflush(stdout);
fprintf(stderr, "\nx265: asm primitive has failed. Go and fix that Right Now!\n");
return -1;
}
}
}
/******************* Cycle count for all primitives **********************/
EncoderPrimitives optprim;
memset(&optprim, 0, sizeof(optprim));
setupInstrinsicPrimitives(optprim, cpuid);
setupAssemblyPrimitives(optprim, cpuid);
/* Note that we do not setup aliases for performance tests, that would be
* redundant. The testbench only verifies they are correctly aliased */
/* some hybrid primitives may rely on other primitives in the
* global primitive table, so set up those pointers. This is a
* bit ugly, but I don't see a better solution */
memcpy(&primitives, &optprim, sizeof(EncoderPrimitives));
printf("\nTest performance improvement with full optimizations\n");
fflush(stdout);
for (size_t h = 0; h < sizeof(harness) / sizeof(TestHarness*); h++)
{
if (testname && strncmp(testname, harness[h]->getName(), strlen(testname)))
continue;
printf("== %s primitives ==\n", harness[h]->getName());
harness[h]->measureSpeed(cprim, optprim);
}
printf("\n");
return 0;
}