| Index: tools/skpbench/skpbench.cpp
|
| diff --git a/tools/skpbench/skpbench.cpp b/tools/skpbench/skpbench.cpp
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..afe44b5c7b022f0bbd2d7c3d1d3d4ccaa5da9f37
|
| --- /dev/null
|
| +++ b/tools/skpbench/skpbench.cpp
|
| @@ -0,0 +1,326 @@
|
| +/*
|
| + * Copyright 2016 Google Inc.
|
| + *
|
| + * Use of this source code is governed by a BSD-style license that can be
|
| + * found in the LICENSE file.
|
| + */
|
| +
|
| +#include "GrContextFactory.h"
|
| +#include "SkCanvas.h"
|
| +#include "SkOSFile.h"
|
| +#include "SkPicture.h"
|
| +#include "SkStream.h"
|
| +#include "SkSurface.h"
|
| +#include "SkSurfaceProps.h"
|
| +#include "picture_utils.h"
|
| +#include "flags/SkCommandLineFlags.h"
|
| +#include "flags/SkCommonFlagsConfig.h"
|
| +#include <stdlib.h>
|
| +#include <algorithm>
|
| +#include <array>
|
| +#include <chrono>
|
| +#include <cmath>
|
| +#include <vector>
|
| +
|
| +/**
|
| + * This is a minimalist program whose sole purpose is to open an skp file, benchmark it on a single
|
| + * config, and exit. It is intended to be used through skpbench.py rather than invoked directly.
|
| + * Limiting the entire process to a single config/skp pair helps to keep the results repeatable.
|
| + *
|
| + * No tiling, looping, or other fanciness is used; it just draws the skp whole into a size-matched
|
| + * render target and syncs the GPU after each draw.
|
| + *
|
| + * The results consist of a fixed amount of samples (--samples). A sample is defined as the number
|
| + * of frames rendered within a set amount of time (--sampleMs).
|
| + *
|
| + * Currently, only GPU configs are supported.
|
| + */
|
| +
|
| +DEFINE_int32(samples, 101, "number of samples to collect");
|
| +DEFINE_int32(sampleMs, 50, "duration of each sample");
|
| +DEFINE_bool(fps, false, "use fps instead of ms");
|
| +DEFINE_string(skp, "", "path to a single .skp file to benchmark");
|
| +DEFINE_string(png, "", "if set, save a .png proof to disk at this file location");
|
| +DEFINE_int32(verbosity, 4, "level of verbosity (0=none to 5=debug)");
|
| +DEFINE_bool(suppressHeader, false, "don't print a header row before the results");
|
| +
|
| +static const char* header =
|
| + " median accum max min stddev metric samples sample_ms config bench";
|
| +
|
| +static const char* resultFormat =
|
| + "%8.4g %8.4g %8.4g %8.4g %6.3g%% %-6s %7li %9i %-9s %s";
|
| +
|
| +struct Sample {
|
| + using clock = std::chrono::high_resolution_clock;
|
| +
|
| + Sample() : fFrames(0), fDuration(0) {}
|
| + double seconds() const { return std::chrono::duration<double>(fDuration).count(); }
|
| + double ms() const { return std::chrono::duration<double, std::milli>(fDuration).count(); }
|
| + double value() const { return FLAGS_fps ? fFrames / this->seconds() : this->ms() / fFrames; }
|
| + static const char* metric() { return FLAGS_fps ? "fps" : "ms"; }
|
| +
|
| + int fFrames;
|
| + clock::duration fDuration;
|
| +};
|
| +
|
| +enum class ExitErr {
|
| + kOk = 0,
|
| + kUsage = 64,
|
| + kData = 65,
|
| + kUnavailable = 69,
|
| + kIO = 74,
|
| + kSoftware = 70
|
| +};
|
| +
|
| +static void draw_skp_and_flush(SkCanvas*, const SkPicture*);
|
| +static SkPlatformGpuFence insert_verified_fence(const SkGpuFenceSync*);
|
| +static void wait_fence_and_delete(const SkGpuFenceSync*, SkPlatformGpuFence);
|
| +static bool mkdir_p(const SkString& name);
|
| +static SkString join(const SkCommandLineFlags::StringArray&);
|
| +static void exitf(ExitErr, const char* format, ...);
|
| +
|
| +static void run_benchmark(const SkGpuFenceSync* sync, SkCanvas* canvas, const SkPicture* skp,
|
| + std::vector<Sample>* samples) {
|
| + using clock = Sample::clock;
|
| + std::chrono::milliseconds sampleMs(FLAGS_sampleMs);
|
| +
|
| + samples->clear();
|
| + samples->resize(FLAGS_samples);
|
| +
|
| + // Prime the graphics pipe.
|
| + SkPlatformGpuFence frameN_minus_2, frameN_minus_1;
|
| + {
|
| + draw_skp_and_flush(canvas, skp);
|
| + SkPlatformGpuFence frame0 = insert_verified_fence(sync);
|
| +
|
| + draw_skp_and_flush(canvas, skp);
|
| + frameN_minus_2 = insert_verified_fence(sync);
|
| +
|
| + draw_skp_and_flush(canvas, skp);
|
| + frameN_minus_1 = insert_verified_fence(sync);
|
| +
|
| + wait_fence_and_delete(sync, frame0);
|
| + }
|
| +
|
| + clock::time_point start = clock::now();
|
| +
|
| + for (Sample& sample : *samples) {
|
| + clock::time_point end;
|
| + do {
|
| + draw_skp_and_flush(canvas, skp);
|
| +
|
| + // Sync the GPU.
|
| + wait_fence_and_delete(sync, frameN_minus_2);
|
| + frameN_minus_2 = frameN_minus_1;
|
| + frameN_minus_1 = insert_verified_fence(sync);
|
| +
|
| + end = clock::now();
|
| + sample.fDuration = end - start;
|
| + ++sample.fFrames;
|
| + } while (sample.fDuration < sampleMs);
|
| +
|
| + if (FLAGS_verbosity >= 5) {
|
| + fprintf(stderr, "%.4g%s [ms=%.4g frames=%i]\n",
|
| + sample.value(), Sample::metric(), sample.ms(), sample.fFrames);
|
| + }
|
| +
|
| + start = end;
|
| + }
|
| +
|
| + sync->deleteFence(frameN_minus_2);
|
| + sync->deleteFence(frameN_minus_1);
|
| +}
|
| +
|
| +void print_result(const std::vector<Sample>& samples, const char* config, const char* bench) {
|
| + if (0 == (samples.size() % 2)) {
|
| + exitf(ExitErr::kSoftware, "attempted to gather stats on even number of samples");
|
| + }
|
| +
|
| + Sample accum = Sample();
|
| + std::vector<double> values;
|
| + values.reserve(samples.size());
|
| + for (const Sample& sample : samples) {
|
| + accum.fFrames += sample.fFrames;
|
| + accum.fDuration += sample.fDuration;
|
| + values.push_back(sample.value());
|
| + }
|
| + std::sort(values.begin(), values.end());
|
| + const double median = values[values.size() / 2];
|
| +
|
| + const double meanValue = accum.value();
|
| + double variance = 0;
|
| + for (const Sample& sample : samples) {
|
| + const double delta = sample.value() - meanValue;
|
| + variance += delta * delta;
|
| + }
|
| + variance /= samples.size();
|
| + // Technically, this is the relative standard deviation.
|
| + const double stddev = 100/*%*/ * sqrt(variance) / meanValue;
|
| +
|
| + printf(resultFormat, median, accum.value(), values.back(), values.front(), stddev,
|
| + Sample::metric(), values.size(), FLAGS_sampleMs, config, bench);
|
| + printf("\n");
|
| + fflush(stdout);
|
| +}
|
| +
|
| +int main(int argc, char** argv) {
|
| + SkCommandLineFlags::SetUsage("Use skpbench.py instead. "
|
| + "You usually don't want to use this program directly.");
|
| + SkCommandLineFlags::Parse(argc, argv);
|
| +
|
| + if (!FLAGS_suppressHeader) {
|
| + printf("%s\n", header);
|
| + }
|
| + if (FLAGS_samples <= 0) {
|
| + exit(0); // This can be used to print the header and quit.
|
| + }
|
| + if (0 == FLAGS_samples % 2) {
|
| + fprintf(stderr, "WARNING: even number of samples requested (%i); "
|
| + "using %i so there can be a true median.\n",
|
| + FLAGS_samples, FLAGS_samples + 1);
|
| + ++FLAGS_samples;
|
| + }
|
| +
|
| + // Parse the config.
|
| + const SkCommandLineConfigGpu* config = nullptr; // Initialize for spurious warning.
|
| + SkCommandLineConfigArray configs;
|
| + ParseConfigs(FLAGS_config, &configs);
|
| + if (configs.count() != 1 || !(config = configs[0]->asConfigGpu())) {
|
| + exitf(ExitErr::kUsage, "invalid config %s; must specify one (and only one) GPU config",
|
| + join(FLAGS_config).c_str());
|
| + }
|
| +
|
| + // Parse the skp.
|
| + if (FLAGS_skp.count() != 1) {
|
| + exitf(ExitErr::kUsage, "invalid skp \"%s\"; one (and only one) skp must be specified.",
|
| + join(FLAGS_skp).c_str());
|
| + }
|
| + const char* skpfile = FLAGS_skp[0];
|
| + std::unique_ptr<SkStream> skpstream(SkStream::MakeFromFile(skpfile));
|
| + if (!skpstream) {
|
| + exitf(ExitErr::kIO, "failed to open skp file %s", skpfile);
|
| + }
|
| + sk_sp<SkPicture> skp = SkPicture::MakeFromStream(skpstream.get());
|
| + if (!skp) {
|
| + exitf(ExitErr::kData, "failed to parse skp file %s", skpfile);
|
| + }
|
| + int width = SkTMin(SkScalarCeilToInt(skp->cullRect().width()), 2048),
|
| + height = SkTMin(SkScalarCeilToInt(skp->cullRect().height()), 2048);
|
| + if (FLAGS_verbosity >= 2 &&
|
| + (width != skp->cullRect().width() || height != skp->cullRect().height())) {
|
| + fprintf(stderr, "NOTE: %s is too large (%ix%i); cropping to %ix%i.\n",
|
| + skpfile, SkScalarCeilToInt(skp->cullRect().width()),
|
| + SkScalarCeilToInt(skp->cullRect().height()), width, height);
|
| + }
|
| +
|
| + // Create a context.
|
| + sk_gpu_test::GrContextFactory factory;
|
| + sk_gpu_test::ContextInfo ctxInfo =
|
| + factory.getContextInfo(config->getContextType(), config->getContextOptions());
|
| + GrContext* ctx = ctxInfo.grContext();
|
| + if (!ctx) {
|
| + exitf(ExitErr::kUnavailable, "failed to create context for config %s",
|
| + config->getTag().c_str());
|
| + }
|
| + if (ctx->caps()->maxRenderTargetSize() < SkTMax(width, height)) {
|
| + exitf(ExitErr::kUnavailable, "render target size %ix%i not supported by platform (max: %i)",
|
| + width, height, ctx->caps()->maxRenderTargetSize());
|
| + }
|
| + if (ctx->caps()->maxSampleCount() < config->getSamples()) {
|
| + exitf(ExitErr::kUnavailable, "sample count %i not supported by platform (max: %i)",
|
| + config->getSamples(), ctx->caps()->maxSampleCount());
|
| + }
|
| + sk_gpu_test::TestContext* testCtx = ctxInfo.testContext();
|
| + if (!testCtx) {
|
| + exitf(ExitErr::kSoftware, "testContext is null");
|
| + }
|
| + if (!testCtx->fenceSyncSupport()) {
|
| + exitf(ExitErr::kUnavailable, "GPU does not support fence sync");
|
| + }
|
| +
|
| + // Create a render target.
|
| + SkImageInfo info = SkImageInfo::Make(width, height, config->getColorType(),
|
| + kPremul_SkAlphaType, sk_ref_sp(config->getColorSpace()));
|
| + uint32_t flags = config->getUseDIText() ? SkSurfaceProps::kUseDeviceIndependentFonts_Flag : 0;
|
| + SkSurfaceProps props(flags, SkSurfaceProps::kLegacyFontHost_InitType);
|
| + sk_sp<SkSurface> surface =
|
| + SkSurface::MakeRenderTarget(ctx, SkBudgeted::kNo, info, config->getSamples(), &props);
|
| + if (!surface) {
|
| + exitf(ExitErr::kUnavailable, "failed to create %ix%i render target for config %s",
|
| + width, height, config->getTag().c_str());
|
| + }
|
| +
|
| + // Run the benchmark.
|
| + std::vector<Sample> samples;
|
| + SkCanvas* canvas = surface->getCanvas();
|
| + canvas->translate(-skp->cullRect().x(), -skp->cullRect().y());
|
| + run_benchmark(testCtx->fenceSync(), canvas, skp.get(), &samples);
|
| + print_result(samples, config->getTag().c_str(), SkOSPath::Basename(skpfile).c_str());
|
| +
|
| + // Save a proof (if one was requested).
|
| + if (!FLAGS_png.isEmpty()) {
|
| + SkBitmap bmp;
|
| + bmp.setInfo(info);
|
| + if (!surface->getCanvas()->readPixels(&bmp, 0, 0)) {
|
| + exitf(ExitErr::kUnavailable, "failed to read canvas pixels for png");
|
| + }
|
| + const SkString &dirname = SkOSPath::Dirname(FLAGS_png[0]),
|
| + &basename = SkOSPath::Basename(FLAGS_png[0]);
|
| + if (!mkdir_p(dirname)) {
|
| + exitf(ExitErr::kIO, "failed to create directory \"%s\" for png", dirname.c_str());
|
| + }
|
| + if (!sk_tools::write_bitmap_to_disk(bmp, dirname, nullptr, basename)) {
|
| + exitf(ExitErr::kIO, "failed to save png to \"%s\"", FLAGS_png[0]);
|
| + }
|
| + }
|
| +
|
| + exit(0);
|
| +}
|
| +
|
| +static void draw_skp_and_flush(SkCanvas* canvas, const SkPicture* skp) {
|
| + canvas->drawPicture(skp);
|
| + canvas->flush();
|
| +}
|
| +
|
| +static SkPlatformGpuFence insert_verified_fence(const SkGpuFenceSync* sync) {
|
| + SkPlatformGpuFence fence = sync->insertFence();
|
| + if (kInvalidPlatformGpuFence == fence) {
|
| + exitf(ExitErr::kUnavailable, "failed to insert fence");
|
| + }
|
| + return fence;
|
| +}
|
| +
|
| +static void wait_fence_and_delete(const SkGpuFenceSync* sync, SkPlatformGpuFence fence) {
|
| + if (kInvalidPlatformGpuFence == fence) {
|
| + exitf(ExitErr::kSoftware, "attempted to wait on invalid fence");
|
| + }
|
| + if (!sync->waitFence(fence)) {
|
| + exitf(ExitErr::kUnavailable, "failed to wait for fence");
|
| + }
|
| + sync->deleteFence(fence);
|
| +}
|
| +
|
| +bool mkdir_p(const SkString& dirname) {
|
| + if (dirname.isEmpty()) {
|
| + return true;
|
| + }
|
| + return mkdir_p(SkOSPath::Dirname(dirname.c_str())) && sk_mkdir(dirname.c_str());
|
| +}
|
| +
|
| +static SkString join(const SkCommandLineFlags::StringArray& stringArray) {
|
| + SkString joined;
|
| + for (int i = 0; i < FLAGS_config.count(); ++i) {
|
| + joined.appendf(i ? " %s" : "%s", FLAGS_config[i]);
|
| + }
|
| + return joined;
|
| +}
|
| +
|
| +static void exitf(ExitErr err, const char* format, ...) {
|
| + fprintf(stderr, ExitErr::kSoftware == err ? "INTERNAL ERROR: " : "ERROR: ");
|
| + va_list args;
|
| + va_start(args, format);
|
| + vfprintf(stderr, format, args);
|
| + va_end(args);
|
| + fprintf(stderr, ExitErr::kSoftware == err ? "; this should never happen.\n": ".\n");
|
| + exit((int)err);
|
| +}
|
|
|