libbpg/x265/source/x265.cpp
2015-10-27 11:46:00 +01:00

754 lines
23 KiB
C++

/*****************************************************************************
* Copyright (C) 2013 x265 project
*
* Authors: Steve Borho <steve@borho.org>
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA.
*
* This program is also available under a commercial proprietary license.
* For more information, contact us at license @ x265.com.
*****************************************************************************/
#if _MSC_VER
#pragma warning(disable: 4127) // conditional expression is constant, yes I know
#endif
#include "x265.h"
#include "x265-extras.h"
#include "x265cli.h"
#include "common.h"
#include "input/input.h"
#include "output/output.h"
#include "output/reconplay.h"
#include "param.h"
#include "cpu.h"
#if HAVE_VLD
/* Visual Leak Detector */
#include <vld.h>
#endif
#include <signal.h>
#include <errno.h>
#include <fcntl.h>
#include <string>
#include <ostream>
#include <fstream>
#include <queue>
#define CONSOLE_TITLE_SIZE 200
#ifdef _WIN32
#include <windows.h>
static char orgConsoleTitle[CONSOLE_TITLE_SIZE] = "";
#else
#define GetConsoleTitle(t, n)
#define SetConsoleTitle(t)
#define SetThreadExecutionState(es)
#endif
using namespace X265_NS;
/* Ctrl-C handler */
static volatile sig_atomic_t b_ctrl_c /* = 0 */;
static void sigint_handler(int)
{
b_ctrl_c = 1;
}
struct CLIOptions
{
InputFile* input;
ReconFile* recon;
OutputFile* output;
FILE* qpfile;
FILE* csvfpt;
const char* csvfn;
const char* reconPlayCmd;
const x265_api* api;
x265_param* param;
bool bProgress;
bool bForceY4m;
bool bDither;
int csvLogLevel;
uint32_t seek; // number of frames to skip from the beginning
uint32_t framesToBeEncoded; // number of frames to encode
uint64_t totalbytes;
int64_t startTime;
int64_t prevUpdateTime;
/* in microseconds */
static const int UPDATE_INTERVAL = 250000;
CLIOptions()
{
input = NULL;
recon = NULL;
output = NULL;
qpfile = NULL;
csvfpt = NULL;
csvfn = NULL;
reconPlayCmd = NULL;
api = NULL;
param = NULL;
framesToBeEncoded = seek = 0;
totalbytes = 0;
bProgress = true;
bForceY4m = false;
startTime = x265_mdate();
prevUpdateTime = 0;
bDither = false;
csvLogLevel = 0;
}
void destroy();
void printStatus(uint32_t frameNum);
bool parse(int argc, char **argv);
bool parseQPFile(x265_picture &pic_org);
};
void CLIOptions::destroy()
{
if (input)
input->release();
input = NULL;
if (recon)
recon->release();
recon = NULL;
if (qpfile)
fclose(qpfile);
qpfile = NULL;
if (csvfpt)
fclose(csvfpt);
csvfpt = NULL;
if (output)
output->release();
output = NULL;
}
void CLIOptions::printStatus(uint32_t frameNum)
{
char buf[200];
int64_t time = x265_mdate();
if (!bProgress || !frameNum || (prevUpdateTime && time - prevUpdateTime < UPDATE_INTERVAL))
return;
int64_t elapsed = time - startTime;
double fps = elapsed > 0 ? frameNum * 1000000. / elapsed : 0;
float bitrate = 0.008f * totalbytes * (param->fpsNum / param->fpsDenom) / ((float)frameNum);
if (framesToBeEncoded)
{
int eta = (int)(elapsed * (framesToBeEncoded - frameNum) / ((int64_t)frameNum * 1000000));
sprintf(buf, "x265 [%.1f%%] %d/%d frames, %.2f fps, %.2f kb/s, eta %d:%02d:%02d",
100. * frameNum / framesToBeEncoded, frameNum, framesToBeEncoded, fps, bitrate,
eta / 3600, (eta / 60) % 60, eta % 60);
}
else
sprintf(buf, "x265 %d frames: %.2f fps, %.2f kb/s", frameNum, fps, bitrate);
fprintf(stderr, "%s \r", buf + 5);
SetConsoleTitle(buf);
fflush(stderr); // needed in windows
prevUpdateTime = time;
}
bool CLIOptions::parse(int argc, char **argv)
{
bool bError = false;
int bShowHelp = false;
int inputBitDepth = 8;
int outputBitDepth = 0;
int reconFileBitDepth = 0;
const char *inputfn = NULL;
const char *reconfn = NULL;
const char *outputfn = NULL;
const char *preset = NULL;
const char *tune = NULL;
const char *profile = NULL;
if (argc <= 1)
{
x265_log(NULL, X265_LOG_ERROR, "No input file. Run x265 --help for a list of options.\n");
return true;
}
/* Presets are applied before all other options. */
for (optind = 0;; )
{
int c = getopt_long(argc, argv, short_options, long_options, NULL);
if (c == -1)
break;
else if (c == 'p')
preset = optarg;
else if (c == 't')
tune = optarg;
else if (c == 'D')
outputBitDepth = atoi(optarg);
else if (c == 'P')
profile = optarg;
else if (c == '?')
bShowHelp = true;
}
if (!outputBitDepth && profile)
{
/* try to derive the output bit depth from the requested profile */
if (strstr(profile, "10"))
outputBitDepth = 10;
else if (strstr(profile, "12"))
outputBitDepth = 12;
else
outputBitDepth = 8;
}
api = x265_api_get(outputBitDepth);
if (!api)
{
x265_log(NULL, X265_LOG_WARNING, "falling back to default bit-depth\n");
api = x265_api_get(0);
}
param = api->param_alloc();
if (!param)
{
x265_log(NULL, X265_LOG_ERROR, "param alloc failed\n");
return true;
}
if (api->param_default_preset(param, preset, tune) < 0)
{
x265_log(NULL, X265_LOG_ERROR, "preset or tune unrecognized\n");
return true;
}
if (bShowHelp)
{
printVersion(param, api);
showHelp(param);
}
for (optind = 0;; )
{
int long_options_index = -1;
int c = getopt_long(argc, argv, short_options, long_options, &long_options_index);
if (c == -1)
break;
switch (c)
{
case 'h':
printVersion(param, api);
showHelp(param);
break;
case 'V':
printVersion(param, api);
x265_report_simd(param);
exit(0);
default:
if (long_options_index < 0 && c > 0)
{
for (size_t i = 0; i < sizeof(long_options) / sizeof(long_options[0]); i++)
{
if (long_options[i].val == c)
{
long_options_index = (int)i;
break;
}
}
if (long_options_index < 0)
{
/* getopt_long might have already printed an error message */
if (c != 63)
x265_log(NULL, X265_LOG_WARNING, "internal error: short option '%c' has no long option\n", c);
return true;
}
}
if (long_options_index < 0)
{
x265_log(NULL, X265_LOG_WARNING, "short option '%c' unrecognized\n", c);
return true;
}
#define OPT(longname) \
else if (!strcmp(long_options[long_options_index].name, longname))
#define OPT2(name1, name2) \
else if (!strcmp(long_options[long_options_index].name, name1) || \
!strcmp(long_options[long_options_index].name, name2))
if (0) ;
OPT2("frame-skip", "seek") this->seek = (uint32_t)x265_atoi(optarg, bError);
OPT("frames") this->framesToBeEncoded = (uint32_t)x265_atoi(optarg, bError);
OPT("csv") this->csvfn = optarg;
OPT("csv-log-level") this->csvLogLevel = x265_atoi(optarg, bError);
OPT("no-progress") this->bProgress = false;
OPT("output") outputfn = optarg;
OPT("input") inputfn = optarg;
OPT("recon") reconfn = optarg;
OPT("input-depth") inputBitDepth = (uint32_t)x265_atoi(optarg, bError);
OPT("dither") this->bDither = true;
OPT("recon-depth") reconFileBitDepth = (uint32_t)x265_atoi(optarg, bError);
OPT("y4m") this->bForceY4m = true;
OPT("profile") /* handled above */;
OPT("preset") /* handled above */;
OPT("tune") /* handled above */;
OPT("output-depth") /* handled above */;
OPT("recon-y4m-exec") reconPlayCmd = optarg;
OPT("qpfile")
{
this->qpfile = fopen(optarg, "rb");
if (!this->qpfile)
{
x265_log(param, X265_LOG_ERROR, "%s qpfile not found or error in opening qp file\n", optarg);
return false;
}
}
else
bError |= !!api->param_parse(param, long_options[long_options_index].name, optarg);
if (bError)
{
const char *name = long_options_index > 0 ? long_options[long_options_index].name : argv[optind - 2];
x265_log(NULL, X265_LOG_ERROR, "invalid argument: %s = %s\n", name, optarg);
return true;
}
#undef OPT
}
}
if (optind < argc && !inputfn)
inputfn = argv[optind++];
if (optind < argc && !outputfn)
outputfn = argv[optind++];
if (optind < argc)
{
x265_log(param, X265_LOG_WARNING, "extra unused command arguments given <%s>\n", argv[optind]);
return true;
}
if (argc <= 1)
{
api->param_default(param);
printVersion(param, api);
showHelp(param);
}
if (!inputfn || !outputfn)
{
x265_log(param, X265_LOG_ERROR, "input or output file not specified, try --help for help\n");
return true;
}
if (param->internalBitDepth != api->bit_depth)
{
x265_log(param, X265_LOG_ERROR, "Only bit depths of %d are supported in this build\n", api->bit_depth);
return true;
}
InputFileInfo info;
info.filename = inputfn;
info.depth = inputBitDepth;
info.csp = param->internalCsp;
info.width = param->sourceWidth;
info.height = param->sourceHeight;
info.fpsNum = param->fpsNum;
info.fpsDenom = param->fpsDenom;
info.sarWidth = param->vui.sarWidth;
info.sarHeight = param->vui.sarHeight;
info.skipFrames = seek;
info.frameCount = 0;
getParamAspectRatio(param, info.sarWidth, info.sarHeight);
this->input = InputFile::open(info, this->bForceY4m);
if (!this->input || this->input->isFail())
{
x265_log(param, X265_LOG_ERROR, "unable to open input file <%s>\n", inputfn);
return true;
}
if (info.depth < 8 || info.depth > 16)
{
x265_log(param, X265_LOG_ERROR, "Input bit depth (%d) must be between 8 and 16\n", inputBitDepth);
return true;
}
/* Unconditionally accept height/width/csp from file info */
param->sourceWidth = info.width;
param->sourceHeight = info.height;
param->internalCsp = info.csp;
/* Accept fps and sar from file info if not specified by user */
if (param->fpsDenom == 0 || param->fpsNum == 0)
{
param->fpsDenom = info.fpsDenom;
param->fpsNum = info.fpsNum;
}
if (!param->vui.aspectRatioIdc && info.sarWidth && info.sarHeight)
setParamAspectRatio(param, info.sarWidth, info.sarHeight);
if (this->framesToBeEncoded == 0 && info.frameCount > (int)seek)
this->framesToBeEncoded = info.frameCount - seek;
param->totalFrames = this->framesToBeEncoded;
/* Force CFR until we have support for VFR */
info.timebaseNum = param->fpsDenom;
info.timebaseDenom = param->fpsNum;
if (api->param_apply_profile(param, profile))
return true;
if (param->logLevel >= X265_LOG_INFO)
{
char buf[128];
int p = sprintf(buf, "%dx%d fps %d/%d %sp%d", param->sourceWidth, param->sourceHeight,
param->fpsNum, param->fpsDenom, x265_source_csp_names[param->internalCsp], info.depth);
int width, height;
getParamAspectRatio(param, width, height);
if (width && height)
p += sprintf(buf + p, " sar %d:%d", width, height);
if (framesToBeEncoded <= 0 || info.frameCount <= 0)
strcpy(buf + p, " unknown frame count");
else
sprintf(buf + p, " frames %u - %d of %d", this->seek, this->seek + this->framesToBeEncoded - 1, info.frameCount);
general_log(param, input->getName(), X265_LOG_INFO, "%s\n", buf);
}
this->input->startReader();
if (reconfn)
{
if (reconFileBitDepth == 0)
reconFileBitDepth = param->internalBitDepth;
this->recon = ReconFile::open(reconfn, param->sourceWidth, param->sourceHeight, reconFileBitDepth,
param->fpsNum, param->fpsDenom, param->internalCsp);
if (this->recon->isFail())
{
x265_log(param, X265_LOG_WARNING, "unable to write reconstructed outputs file\n");
this->recon->release();
this->recon = 0;
}
else
general_log(param, this->recon->getName(), X265_LOG_INFO,
"reconstructed images %dx%d fps %d/%d %s\n",
param->sourceWidth, param->sourceHeight, param->fpsNum, param->fpsDenom,
x265_source_csp_names[param->internalCsp]);
}
this->output = OutputFile::open(outputfn, info);
if (this->output->isFail())
{
x265_log(param, X265_LOG_ERROR, "failed to open output file <%s> for writing\n", outputfn);
return true;
}
general_log(param, this->output->getName(), X265_LOG_INFO, "output file: %s\n", outputfn);
return false;
}
bool CLIOptions::parseQPFile(x265_picture &pic_org)
{
int32_t num = -1, qp, ret;
char type;
uint32_t filePos;
pic_org.forceqp = 0;
pic_org.sliceType = X265_TYPE_AUTO;
while (num < pic_org.poc)
{
filePos = ftell(qpfile);
qp = -1;
ret = fscanf(qpfile, "%d %c%*[ \t]%d\n", &num, &type, &qp);
if (num > pic_org.poc || ret == EOF)
{
fseek(qpfile, filePos, SEEK_SET);
break;
}
if (num < pic_org.poc && ret >= 2)
continue;
if (ret == 3 && qp >= 0)
pic_org.forceqp = qp + 1;
if (type == 'I') pic_org.sliceType = X265_TYPE_IDR;
else if (type == 'i') pic_org.sliceType = X265_TYPE_I;
else if (type == 'P') pic_org.sliceType = X265_TYPE_P;
else if (type == 'B') pic_org.sliceType = X265_TYPE_BREF;
else if (type == 'b') pic_org.sliceType = X265_TYPE_B;
else ret = 0;
if (ret < 2 || qp < -1 || qp > 51)
return 0;
}
return 1;
}
/* CLI return codes:
*
* 0 - encode successful
* 1 - unable to parse command line
* 2 - unable to open encoder
* 3 - unable to generate stream headers
* 4 - encoder abort
* 5 - unable to open csv file */
int main(int argc, char **argv)
{
#if HAVE_VLD
// This uses Microsoft's proprietary WCHAR type, but this only builds on Windows to start with
VLDSetReportOptions(VLD_OPT_REPORT_TO_DEBUGGER | VLD_OPT_REPORT_TO_FILE, L"x265_leaks.txt");
#endif
PROFILE_INIT();
THREAD_NAME("API", 0);
GetConsoleTitle(orgConsoleTitle, CONSOLE_TITLE_SIZE);
SetThreadExecutionState(ES_CONTINUOUS | ES_SYSTEM_REQUIRED | ES_AWAYMODE_REQUIRED);
ReconPlay* reconPlay = NULL;
CLIOptions cliopt;
if (cliopt.parse(argc, argv))
{
cliopt.destroy();
if (cliopt.api)
cliopt.api->param_free(cliopt.param);
exit(1);
}
x265_param* param = cliopt.param;
const x265_api* api = cliopt.api;
/* This allows muxers to modify bitstream format */
cliopt.output->setParam(param);
if (cliopt.reconPlayCmd)
reconPlay = new ReconPlay(cliopt.reconPlayCmd, *param);
/* note: we could try to acquire a different libx265 API here based on
* the profile found during option parsing, but it must be done before
* opening an encoder */
x265_encoder *encoder = api->encoder_open(param);
if (!encoder)
{
x265_log(param, X265_LOG_ERROR, "failed to open encoder\n");
cliopt.destroy();
api->param_free(param);
api->cleanup();
exit(2);
}
/* get the encoder parameters post-initialization */
api->encoder_parameters(encoder, param);
if (cliopt.csvfn)
{
cliopt.csvfpt = x265_csvlog_open(*api, *param, cliopt.csvfn, cliopt.csvLogLevel);
if (!cliopt.csvfpt)
{
x265_log(param, X265_LOG_ERROR, "Unable to open CSV log file <%s>, aborting\n", cliopt.csvfn);
cliopt.destroy();
if (cliopt.api)
cliopt.api->param_free(cliopt.param);
exit(5);
}
}
/* Control-C handler */
if (signal(SIGINT, sigint_handler) == SIG_ERR)
x265_log(param, X265_LOG_ERROR, "Unable to register CTRL+C handler: %s\n", strerror(errno));
x265_picture pic_orig, pic_out;
x265_picture *pic_in = &pic_orig;
/* Allocate recon picture if analysisMode is enabled */
std::priority_queue<int64_t>* pts_queue = cliopt.output->needPTS() ? new std::priority_queue<int64_t>() : NULL;
x265_picture *pic_recon = (cliopt.recon || !!param->analysisMode || pts_queue || reconPlay || cliopt.csvLogLevel) ? &pic_out : NULL;
uint32_t inFrameCount = 0;
uint32_t outFrameCount = 0;
x265_nal *p_nal;
x265_stats stats;
uint32_t nal;
int16_t *errorBuf = NULL;
int ret = 0;
if (!param->bRepeatHeaders)
{
if (api->encoder_headers(encoder, &p_nal, &nal) < 0)
{
x265_log(param, X265_LOG_ERROR, "Failure generating stream headers\n");
ret = 3;
goto fail;
}
else
cliopt.totalbytes += cliopt.output->writeHeaders(p_nal, nal);
}
api->picture_init(param, pic_in);
if (cliopt.bDither)
{
errorBuf = X265_MALLOC(int16_t, param->sourceWidth + 1);
if (errorBuf)
memset(errorBuf, 0, (param->sourceWidth + 1) * sizeof(int16_t));
else
cliopt.bDither = false;
}
// main encoder loop
while (pic_in && !b_ctrl_c)
{
pic_orig.poc = inFrameCount;
if (cliopt.qpfile)
{
if (!cliopt.parseQPFile(pic_orig))
{
x265_log(NULL, X265_LOG_ERROR, "can't parse qpfile for frame %d\n", pic_in->poc);
fclose(cliopt.qpfile);
cliopt.qpfile = NULL;
}
}
if (cliopt.framesToBeEncoded && inFrameCount >= cliopt.framesToBeEncoded)
pic_in = NULL;
else if (cliopt.input->readPicture(pic_orig))
inFrameCount++;
else
pic_in = NULL;
if (pic_in)
{
if (pic_in->bitDepth > param->internalBitDepth && cliopt.bDither)
{
x265_dither_image(*api, *pic_in, param->sourceWidth, param->sourceHeight, errorBuf, param->internalBitDepth);
pic_in->bitDepth = param->internalBitDepth;
}
/* Overwrite PTS */
pic_in->pts = pic_in->poc;
}
int numEncoded = api->encoder_encode(encoder, &p_nal, &nal, pic_in, pic_recon);
if (numEncoded < 0)
{
b_ctrl_c = 1;
ret = 4;
break;
}
if (reconPlay && numEncoded)
reconPlay->writePicture(*pic_recon);
outFrameCount += numEncoded;
if (numEncoded && pic_recon && cliopt.recon)
cliopt.recon->writePicture(pic_out);
if (nal)
{
cliopt.totalbytes += cliopt.output->writeFrame(p_nal, nal, pic_out);
if (pts_queue)
{
pts_queue->push(-pic_out.pts);
if (pts_queue->size() > 2)
pts_queue->pop();
}
}
cliopt.printStatus(outFrameCount);
if (numEncoded && cliopt.csvLogLevel)
x265_csvlog_frame(cliopt.csvfpt, *param, *pic_recon, cliopt.csvLogLevel);
}
/* Flush the encoder */
while (!b_ctrl_c)
{
int numEncoded = api->encoder_encode(encoder, &p_nal, &nal, NULL, pic_recon);
if (numEncoded < 0)
{
ret = 4;
break;
}
if (reconPlay && numEncoded)
reconPlay->writePicture(*pic_recon);
outFrameCount += numEncoded;
if (numEncoded && pic_recon && cliopt.recon)
cliopt.recon->writePicture(pic_out);
if (nal)
{
cliopt.totalbytes += cliopt.output->writeFrame(p_nal, nal, pic_out);
if (pts_queue)
{
pts_queue->push(-pic_out.pts);
if (pts_queue->size() > 2)
pts_queue->pop();
}
}
cliopt.printStatus(outFrameCount);
if (numEncoded && cliopt.csvLogLevel)
x265_csvlog_frame(cliopt.csvfpt, *param, *pic_recon, cliopt.csvLogLevel);
if (!numEncoded)
break;
}
/* clear progress report */
if (cliopt.bProgress)
fprintf(stderr, "%*s\r", 80, " ");
fail:
delete reconPlay;
api->encoder_get_stats(encoder, &stats, sizeof(stats));
if (cliopt.csvfpt && !b_ctrl_c)
x265_csvlog_encode(cliopt.csvfpt, *api, *param, stats, cliopt.csvLogLevel, argc, argv);
api->encoder_close(encoder);
int64_t second_largest_pts = 0;
int64_t largest_pts = 0;
if (pts_queue && pts_queue->size() >= 2)
{
second_largest_pts = -pts_queue->top();
pts_queue->pop();
largest_pts = -pts_queue->top();
pts_queue->pop();
delete pts_queue;
pts_queue = NULL;
}
cliopt.output->closeFile(largest_pts, second_largest_pts);
if (b_ctrl_c)
general_log(param, NULL, X265_LOG_INFO, "aborted at input frame %d, output frame %d\n",
cliopt.seek + inFrameCount, stats.encodedPictureCount);
api->cleanup(); /* Free library singletons */
cliopt.destroy();
api->param_free(param);
X265_FREE(errorBuf);
SetConsoleTitle(orgConsoleTitle);
SetThreadExecutionState(ES_CONTINUOUS);
#if HAVE_VLD
assert(VLDReportLeaks() == 0);
#endif
return ret;
}