Index: tools/bench_record.cpp |
diff --git a/tools/bench_record.cpp b/tools/bench_record.cpp |
index 025127e4c28f0e8260fc1ab717156840ece2a401..a8d7a8a0e5d7535fb95a3a384174e782abc1c974 100644 |
--- a/tools/bench_record.cpp |
+++ b/tools/bench_record.cpp |
@@ -5,7 +5,6 @@ |
* found in the LICENSE file. |
*/ |
-#include "BenchTimer.h" |
#include "SkCommandLineFlags.h" |
#include "SkForceLinking.h" |
#include "SkGraphics.h" |
@@ -15,28 +14,32 @@ |
#include "SkRecording.h" |
#include "SkStream.h" |
#include "SkString.h" |
+ |
+#include "BenchTimer.h" |
#include "LazyDecodeBitmap.h" |
+#include "Stats.h" |
-__SK_FORCE_IMAGE_DECODER_LINKING; |
+typedef WallTimer Timer; |
-// Just reading all the SKPs takes about 2 seconds for me, which is the same as about 100 loops of |
-// rerecording all the SKPs. So we default to --loops=900, which makes ~90% of our time spent in |
-// recording, and this should take ~20 seconds to run. |
+__SK_FORCE_IMAGE_DECODER_LINKING; |
DEFINE_string2(skps, r, "skps", "Directory containing SKPs to read and re-record."); |
-DEFINE_int32(loops, 900, "Number of times to re-record each SKP."); |
-DEFINE_bool(endRecording, true, "If false, don't time SkPicture::endRecording()"); |
-DEFINE_int32(nullSize, 1000, "Pretend dimension of null source picture."); |
+DEFINE_int32(samples, 10, "Number of times to re-record each SKP."); |
DEFINE_int32(tileGridSize, 512, "Set the tile grid size. Has no effect if bbh is not set to tilegrid."); |
DEFINE_string(bbh, "", "Turn on the bbh and select the type, one of rtree, tilegrid, quadtree"); |
DEFINE_bool(skr, false, "Record SKR instead of SKP."); |
DEFINE_string(match, "", "The usual filters on file names of SKPs to bench."); |
DEFINE_string(timescale, "us", "Print times in ms, us, or ns"); |
- |
-static double scale_time(double ms) { |
- if (FLAGS_timescale.contains("us")) ms *= 1000; |
- if (FLAGS_timescale.contains("ns")) ms *= 1000000; |
- return ms; |
+DEFINE_double(overheadGoal, 0.0001, |
+ "Try to make timer overhead at most this fraction of our sample measurements."); |
+DEFINE_int32(verbose, 0, "0: print min sample; " |
+ "1: print min, mean, max and noise indication " |
+ "2: print all samples"); |
+ |
+static double timescale() { |
+ if (FLAGS_timescale.contains("us")) return 1000; |
+ if (FLAGS_timescale.contains("ns")) return 1000000; |
+ return 1; |
} |
static SkBBHFactory* parse_FLAGS_bbh() { |
@@ -61,35 +64,62 @@ static SkBBHFactory* parse_FLAGS_bbh() { |
return NULL; |
} |
-static void bench_record(SkPicture* src, const char* name, SkBBHFactory* bbhFactory) { |
- BenchTimer timer; |
- timer.start(); |
- const int width = src ? src->width() : FLAGS_nullSize; |
- const int height = src ? src->height() : FLAGS_nullSize; |
- |
- for (int i = 0; i < FLAGS_loops; i++) { |
- if (FLAGS_skr) { |
- EXPERIMENTAL::SkRecording recording(width, height); |
- if (NULL != src) { |
- src->draw(recording.canvas()); |
- } |
- // Release and delete the SkPlayback so that recording optimizes its SkRecord. |
- SkDELETE(recording.releasePlayback()); |
- } else { |
- SkPictureRecorder recorder; |
- SkCanvas* canvas = recorder.beginRecording(width, height, bbhFactory); |
- if (NULL != src) { |
- src->draw(canvas); |
- } |
- if (FLAGS_endRecording) { |
- SkAutoTUnref<SkPicture> dst(recorder.endRecording()); |
- } |
+static void rerecord(const SkPicture& src, SkBBHFactory* bbhFactory) { |
+ if (FLAGS_skr) { |
+ EXPERIMENTAL::SkRecording recording(src.width(), src.height()); |
+ src.draw(recording.canvas()); |
+ // Release and delete the SkPlayback so that recording optimizes its SkRecord. |
+ SkDELETE(recording.releasePlayback()); |
+ } else { |
+ SkPictureRecorder recorder; |
+ src.draw(recorder.beginRecording(src.width(), src.height(), bbhFactory)); |
+ SkAutoTUnref<SkPicture> dst(recorder.endRecording()); |
+ } |
+} |
+ |
+static void bench_record(const SkPicture& src, |
+ const double timerOverhead, |
+ const char* name, |
+ SkBBHFactory* bbhFactory) { |
+ // Rerecord once to warm up any caches. Otherwise the first sample can be very noisy. |
+ rerecord(src, bbhFactory); |
+ |
+ // Rerecord once to see how many times we should loop to make timer overhead insignificant. |
+ Timer timer; |
+ do { |
+ timer.start(timescale()); |
+ rerecord(src, bbhFactory); |
+ timer.end(); |
+ } while (timer.fWall < timerOverhead); // Loop just in case something bizarre happens. |
+ |
+ // We want (timer overhead / measurement) to be less than FLAGS_overheadGoal. |
+ // So in each sample, we'll loop enough times to have made that true for our first measurement. |
+ const int loops = (int)ceil(timerOverhead / timer.fWall / FLAGS_overheadGoal); |
+ |
+ SkAutoTMalloc<double> samples(FLAGS_samples); |
+ for (int i = 0; i < FLAGS_samples; i++) { |
+ timer.start(timescale()); |
+ for (int j = 0; j < loops; j++) { |
+ rerecord(src, bbhFactory); |
} |
+ timer.end(); |
+ samples[i] = timer.fWall / loops; |
} |
- timer.end(); |
- const double msPerLoop = timer.fCpu / (double)FLAGS_loops; |
- printf("%f\t%s\n", scale_time(msPerLoop), name); |
+ Stats stats(samples.get(), FLAGS_samples); |
+ if (FLAGS_verbose == 0) { |
+ printf("%g\t%s\n", stats.min, name); |
+ } else if (FLAGS_verbose == 1) { |
+ // Get a rough idea of how noisy the measurements were. |
+ const double noisePercent = 100 * sqrt(stats.var) / stats.mean; |
+ printf("%g\t%g\t%g\t±%.0f%%\t%s\n", stats.min, stats.mean, stats.max, noisePercent, name); |
+ } else if (FLAGS_verbose == 2) { |
+ printf("%s", name); |
+ for (int i = 0; i < FLAGS_samples; i++) { |
+ printf("\t%g", samples[i]); |
+ } |
+ printf("\n"); |
+ } |
} |
int tool_main(int argc, char** argv); |
@@ -103,10 +133,17 @@ int tool_main(int argc, char** argv) { |
} |
SkAutoTDelete<SkBBHFactory> bbhFactory(parse_FLAGS_bbh()); |
- bench_record(NULL, "NULL", bbhFactory.get()); |
- if (FLAGS_skps.isEmpty()) { |
- return 0; |
+ |
+ // Each run will use this timer overhead estimate to guess how many times it should run. |
+ static const int kOverheadLoops = 10000000; |
+ Timer timer; |
+ double overheadEstimate = 0.0; |
+ for (int i = 0; i < kOverheadLoops; i++) { |
+ timer.start(timescale()); |
+ timer.end(); |
+ overheadEstimate += timer.fWall; |
} |
+ overheadEstimate /= kOverheadLoops; |
SkOSFile::Iter it(FLAGS_skps[0], ".skp"); |
SkString filename; |
@@ -131,7 +168,7 @@ int tool_main(int argc, char** argv) { |
failed = true; |
continue; |
} |
- bench_record(src, filename.c_str(), bbhFactory.get()); |
+ bench_record(*src, overheadEstimate, filename.c_str(), bbhFactory.get()); |
} |
return failed ? 1 : 0; |
} |