Index: gpu/perftests/texture_upload_perftest.cc |
diff --git a/gpu/perftests/texture_upload_perftest.cc b/gpu/perftests/texture_upload_perftest.cc |
index 5f767461cf1bdd5f913d50957b4a383125a4dd4b..e36fb1b2910ef6d36fcea21694b100e75deada49 100644 |
--- a/gpu/perftests/texture_upload_perftest.cc |
+++ b/gpu/perftests/texture_upload_perftest.cc |
@@ -11,11 +11,14 @@ |
#include "base/memory/scoped_ptr.h" |
#include "base/strings/stringprintf.h" |
#include "gpu/perftests/measurements.h" |
+#include "testing/gmock/include/gmock/gmock.h" |
#include "testing/gtest/include/gtest/gtest.h" |
#include "testing/perf/perf_test.h" |
#include "ui/gfx/geometry/size.h" |
+#include "ui/gfx/geometry/vector2d_f.h" |
#include "ui/gl/gl_bindings.h" |
#include "ui/gl/gl_context.h" |
+#include "ui/gl/gl_enums.h" |
#include "ui/gl/gl_surface.h" |
#include "ui/gl/gpu_timing.h" |
#include "ui/gl/scoped_make_current.h" |
@@ -31,11 +34,13 @@ const int kUploadPerfTestRuns = 100; |
// clang-format off |
const char kVertexShader[] = |
SHADER( |
+ uniform vec2 translation = vec2(0.0, 0.0); |
attribute vec2 a_position; |
attribute vec2 a_texCoord; |
varying vec2 v_texCoord; |
void main() { |
- gl_Position = vec4(a_position.x, a_position.y, 0.0, 1.0); |
+ gl_Position = vec4( |
+ translation.x + a_position.x, translation.y + a_position.y, 0.0, 1.0); |
v_texCoord = a_texCoord; |
} |
); |
@@ -77,18 +82,55 @@ GLuint LoadShader(const GLenum type, const char* const src) { |
} |
void GenerateTextureData(const gfx::Size& size, |
+ int bytes_per_pixel, |
const int seed, |
std::vector<uint8>* const pixels) { |
- pixels->resize(size.GetArea() * 4); |
- for (int y = 0; y < size.height(); ++y) { |
- for (int x = 0; x < size.width(); ++x) { |
- const size_t offset = (y * size.width() + x) * 4; |
- pixels->at(offset) = (y + seed) % 64; |
- pixels->at(offset + 1) = (x + seed) % 128; |
- pixels->at(offset + 2) = (y + x + seed) % 256; |
- pixels->at(offset + 3) = 255; |
+ int bytes = size.GetArea() * bytes_per_pixel; |
+ pixels->resize(bytes); |
+ for (int i = 0; i < bytes; ++i) { |
+ int channel = i % bytes_per_pixel; |
+ if (channel == 3) { // Alpha channel. |
+ pixels->at(i) = 255; |
+ } else { |
+ pixels->at(i) = (i + (seed << 2)) % (32 << channel); |
+ } |
+ } |
+} |
+ |
+// Compare a buffer containing pixels in a specified format to GL_RGBA buffer |
+// where the former buffer have been uploaded as a texture and drawn on the |
+// RGBA buffer. |
+bool CompareBufferToRGBABuffer(GLenum format, |
+ const std::vector<uint8>& pixels, |
+ const std::vector<uint8>& pixels_rgba) { |
+ for (size_t i = 0; i < pixels.size(); i += 4) { |
+ switch (format) { |
+ case GL_RED_EXT: // (R_t, 0, 0, 1) |
+ if (pixels_rgba[i] != pixels[i / 4] || pixels_rgba[i + 1] != 0 || |
+ pixels_rgba[i + 2] != 0 || pixels_rgba[i + 3] != 255) { |
+ return false; |
+ } |
+ break; |
+ case GL_LUMINANCE: // (L_t, L_t, L_t, 1) |
+ if (pixels_rgba[i] != pixels[i / 4] || |
+ pixels_rgba[i + 1] != pixels[i / 4] || |
+ pixels_rgba[i + 2] != pixels[i / 4] || pixels_rgba[i + 3] != 255) { |
+ return false; |
+ } |
+ break; |
+ case GL_RGBA: // (R_t, G_t, B_t, A_t) |
+ if (pixels_rgba[i] != pixels[i] || |
+ pixels_rgba[i + 1] != pixels[i + 1] || |
+ pixels_rgba[i + 2] != pixels[i + 2] || |
+ pixels_rgba[i + 3] != pixels[i + 3]) { |
+ return false; |
+ } |
+ break; |
+ default: |
+ NOTREACHED(); |
} |
} |
+ return true; |
} |
// PerfTest to check costs of texture upload at different stages |
@@ -99,8 +141,9 @@ class TextureUploadPerfTest : public testing::Test { |
// Overridden from testing::Test |
void SetUp() override { |
+ static bool gl_initialized = gfx::GLSurface::InitializeOneOff(); |
+ DCHECK(gl_initialized); |
// Initialize an offscreen surface and a gl context. |
- gfx::GLSurface::InitializeOneOff(); |
surface_ = gfx::GLSurface::CreateOffscreenGLSurface(gfx::Size(4, 4)); |
gl_context_ = gfx::GLContext::CreateGLContext(NULL, // share_group |
surface_.get(), |
@@ -146,15 +189,28 @@ class TextureUploadPerfTest : public testing::Test { |
glBindAttribLocation(program_object_, 1, "a_texCoord"); |
glLinkProgram(program_object_); |
+ translation_location_ = |
+ glGetUniformLocation(program_object_, "translation"); |
+ DCHECK_NE(-1, translation_location_); |
+ |
GLint linked = -1; |
glGetProgramiv(program_object_, GL_LINK_STATUS, &linked); |
CHECK_NE(0, linked); |
+ glUseProgram(program_object_); |
+ glUniform1i(sampler_location_, 0); |
sampler_location_ = glGetUniformLocation(program_object_, "a_texture"); |
CHECK_NE(-1, sampler_location_); |
glGenBuffersARB(1, &vertex_buffer_); |
CHECK_NE(0u, vertex_buffer_); |
+ DCHECK_NE(0u, vertex_buffer_); |
+ glBindBuffer(GL_ARRAY_BUFFER, vertex_buffer_); |
+ glVertexAttribPointer(0, 2, GL_FLOAT, GL_FALSE, sizeof(GLfloat) * 4, 0); |
+ glVertexAttribPointer(1, 2, GL_FLOAT, GL_FALSE, sizeof(GLfloat) * 4, |
+ reinterpret_cast<void*>(sizeof(GLfloat) * 2)); |
+ glEnableVertexAttribArray(0); |
+ glEnableVertexAttribArray(1); |
CheckNoGlError(); |
} |
@@ -176,7 +232,6 @@ class TextureUploadPerfTest : public testing::Test { |
-1.f, top, 0.f, 1.f, |
right, top, 1.f, 1.f}; |
// clang-format on |
- |
glBufferData(GL_ARRAY_BUFFER, sizeof(data), data, GL_STATIC_DRAW); |
CheckNoGlError(); |
} |
@@ -199,41 +254,39 @@ class TextureUploadPerfTest : public testing::Test { |
} |
protected: |
- // Upload and draw on the offscren surface. |
- // Return a list of pair. Each pair describe a gl operation and the wall |
- // time elapsed in milliseconds. |
- std::vector<Measurement> UploadAndDraw(const gfx::Size& size, |
- const std::vector<uint8>& pixels, |
- const GLenum format, |
- const GLenum type) { |
- MeasurementTimers total_timers(gpu_timing_client_.get()); |
+ GLuint CreateGLTexture() { |
GLuint texture_id = 0; |
- |
- MeasurementTimers tex_timers(gpu_timing_client_.get()); |
glActiveTexture(GL_TEXTURE0); |
glGenTextures(1, &texture_id); |
glBindTexture(GL_TEXTURE_2D, texture_id); |
+ return texture_id; |
+ } |
+ void UploadTexture(GLuint texture_id, |
+ const gfx::Size& size, |
+ const std::vector<uint8>& pixels, |
+ GLenum format) { |
glTexImage2D(GL_TEXTURE_2D, 0, format, size.width(), size.height(), 0, |
- format, type, &pixels[0]); |
+ format, GL_UNSIGNED_BYTE, &pixels[0]); |
glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_NEAREST); |
glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_NEAREST); |
glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE); |
glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE); |
CheckNoGlError(); |
+ } |
+ |
+ // Upload and draw on the offscren surface. |
+ // Return a list of pair. Each pair describe a gl operation and the wall |
+ // time elapsed in milliseconds. |
+ std::vector<Measurement> UploadAndDraw(const gfx::Size& size, |
+ const std::vector<uint8>& pixels, |
+ const GLenum format) { |
+ GLuint texture_id = CreateGLTexture(); |
+ MeasurementTimers tex_timers(gpu_timing_client_.get()); |
+ UploadTexture(texture_id, size, pixels, format); |
tex_timers.Record(); |
MeasurementTimers draw_timers(gpu_timing_client_.get()); |
- glUseProgram(program_object_); |
- glUniform1i(sampler_location_, 0); |
- |
- DCHECK_NE(0u, vertex_buffer_); |
- glBindBuffer(GL_ARRAY_BUFFER, vertex_buffer_); |
- glVertexAttribPointer(0, 2, GL_FLOAT, GL_FALSE, sizeof(GLfloat) * 4, 0); |
- glVertexAttribPointer(1, 2, GL_FLOAT, GL_FALSE, sizeof(GLfloat) * 4, |
- reinterpret_cast<void*>(sizeof(GLfloat) * 2)); |
- glEnableVertexAttribArray(0); |
- glEnableVertexAttribArray(1); |
glDrawArrays(GL_TRIANGLE_STRIP, 0, 4); |
draw_timers.Record(); |
@@ -242,26 +295,21 @@ class TextureUploadPerfTest : public testing::Test { |
glFinish(); |
CheckNoGlError(); |
finish_timers.Record(); |
- total_timers.Record(); |
glDeleteTextures(1, &texture_id); |
std::vector<uint8> pixels_rendered(size.GetArea() * 4); |
- glReadPixels(0, 0, size.width(), size.height(), GL_RGBA, type, |
+ glReadPixels(0, 0, size.width(), size.height(), GL_RGBA, GL_UNSIGNED_BYTE, |
&pixels_rendered[0]); |
CheckNoGlError(); |
- |
- // TODO(dcastagna): don't assume the format of the texture and do |
- // the appropriate format conversion. |
- EXPECT_EQ(static_cast<GLenum>(GL_RGBA), format); |
- EXPECT_EQ(pixels, pixels_rendered); |
+ EXPECT_TRUE(CompareBufferToRGBABuffer(format, pixels, pixels_rendered)) |
+ << "Format is: " << gfx::GLEnums::GetStringEnum(format); |
std::vector<Measurement> measurements; |
bool gpu_timer_errors = |
gpu_timing_client_->IsAvailable() && |
gpu_timing_client_->CheckAndResetTimerErrors(); |
if (!gpu_timer_errors) { |
- measurements.push_back(total_timers.GetAsMeasurement("total")); |
measurements.push_back(tex_timers.GetAsMeasurement("teximage2d")); |
measurements.push_back(draw_timers.GetAsMeasurement("drawarrays")); |
measurements.push_back(finish_timers.GetAsMeasurement("finish")); |
@@ -269,14 +317,16 @@ class TextureUploadPerfTest : public testing::Test { |
return measurements; |
} |
- void RunUploadAndDrawMultipleTimes(const gfx::Size& size) { |
+ void RunUploadAndDrawMultipleTimes(const gfx::Size& size, |
+ const GLenum format) { |
std::vector<uint8> pixels; |
base::SmallMap<std::map<std::string, Measurement>> |
aggregates; // indexed by name |
int successful_runs = 0; |
+ ASSERT_THAT(format, testing::AnyOf(GL_RGBA, GL_LUMINANCE, GL_RED_EXT)); |
for (int i = 0; i < kUploadPerfWarmupRuns + kUploadPerfTestRuns; ++i) { |
- GenerateTextureData(size, i + 1, &pixels); |
- auto run = UploadAndDraw(size, pixels, GL_RGBA, GL_UNSIGNED_BYTE); |
+ GenerateTextureData(size, format == GL_RGBA ? 4 : 1, i + 1, &pixels); |
+ auto run = UploadAndDraw(size, pixels, format); |
if (i < kUploadPerfWarmupRuns || !run.size()) { |
continue; |
} |
@@ -287,13 +337,15 @@ class TextureUploadPerfTest : public testing::Test { |
aggregate.Increment(measurement); |
} |
} |
+ std::string suffix = base::StringPrintf( |
+ "_%d_%s", size.width(), gfx::GLEnums::GetStringEnum(format).c_str()); |
if (successful_runs) { |
for (const auto& entry : aggregates) { |
const auto m = entry.second.Divide(successful_runs); |
- m.PrintResult(base::StringPrintf("_%d", size.width())); |
+ m.PrintResult(suffix); |
} |
} |
- perf_test::PrintResult("sample_runs", "", "", |
+ perf_test::PrintResult("sample_runs", suffix, "", |
static_cast<size_t>(successful_runs), "laps", true); |
} |
@@ -308,6 +360,7 @@ class TextureUploadPerfTest : public testing::Test { |
GLuint fragment_shader_ = 0; |
GLuint program_object_ = 0; |
GLint sampler_location_ = -1; |
+ GLint translation_location_ = -1; |
GLuint vertex_buffer_ = 0; |
}; |
@@ -315,18 +368,95 @@ class TextureUploadPerfTest : public testing::Test { |
// and prints out aggregated measurements for all the runs. |
TEST_F(TextureUploadPerfTest, glTexImage2d) { |
int sizes[] = {128, 256, 512, 1024}; |
+ std::vector<GLenum> formats; |
+ formats.push_back(GL_RGBA); |
+ // Used by default for ResourceProvider::yuv_resource_format_. |
+ formats.push_back(GL_LUMINANCE); |
+ |
+ ui::ScopedMakeCurrent smc(gl_context_.get(), surface_.get()); |
+ bool has_texture_rg = gl_context_->HasExtension("GL_EXT_texture_rg") || |
+ gl_context_->HasExtension("GL_ARB_texture_rg"); |
+ |
+ if (has_texture_rg) { |
+ // Used as ResourceProvider::yuv_resource_format_ if |
+ // {ARB,EXT}_texture_rg is available. |
+ formats.push_back(GL_RED_EXT); |
+ } |
for (int side : sizes) { |
ASSERT_GE(fbo_size_.width(), side); |
ASSERT_GE(fbo_size_.height(), side); |
- |
gfx::Size size(side, side); |
- ui::ScopedMakeCurrent smc(gl_context_.get(), surface_.get()); |
GenerateVertexBuffer(size); |
+ for (GLenum format : formats) { |
+ RunUploadAndDrawMultipleTimes(size, format); |
+ } |
+ } |
+} |
- DCHECK_NE(0u, framebuffer_object_); |
- glBindFramebufferEXT(GL_FRAMEBUFFER, framebuffer_object_); |
+// Perf test to check if the driver is doing texture renaming. |
+// This test creates one GL texture_id and four different images. For |
+// every image it uploads it using texture_id and it draws multiple |
+// times. The cpu/wall time and the gpu time for all the uploads and |
+// draws, but before glFinish, is computed and is printed out at the end as |
+// "upload_and_draw". If the gpu time is >> than the cpu/wall time we expect the |
+// driver to do texture renaming: this means that while the gpu is drawing using |
+// texture_id it didn't block cpu side the texture upload using the same |
+// texture_id. |
+TEST_F(TextureUploadPerfTest, renaming) { |
+ gfx::Size texture_size(fbo_size_.width() / 2, fbo_size_.height() / 2); |
+ |
+ std::vector<uint8> pixels[4]; |
+ for (int i = 0; i < 4; ++i) { |
+ GenerateTextureData(texture_size, 4, i + 1, &pixels[i]); |
+ } |
+ |
+ ui::ScopedMakeCurrent smc(gl_context_.get(), surface_.get()); |
+ GenerateVertexBuffer(texture_size); |
+ |
+ gfx::Vector2dF positions[] = {gfx::Vector2dF(0.f, 0.f), |
+ gfx::Vector2dF(1.f, 0.f), |
+ gfx::Vector2dF(0.f, 1.f), |
+ gfx::Vector2dF(1.f, 1.f)}; |
+ GLuint texture_id = CreateGLTexture(); |
+ |
+ MeasurementTimers upload_and_draw_timers(gpu_timing_client_.get()); |
+ |
+ for (int i = 0; i < 4; ++i) { |
+ UploadTexture(texture_id, texture_size, pixels[i % 4], GL_RGBA); |
+ DCHECK_NE(-1, translation_location_); |
+ glUniform2f(translation_location_, positions[i % 4].x(), |
+ positions[i % 4].y()); |
+ // Draw the same quad multiple times to make sure that the time spent on the |
+ // gpu is more than the cpu time. |
+ for (int draw = 0; draw < 128; ++draw) { |
+ glDrawArrays(GL_TRIANGLE_STRIP, 0, 4); |
+ } |
+ } |
+ |
+ upload_and_draw_timers.Record(); |
+ MeasurementTimers finish_timers(gpu_timing_client_.get()); |
+ glFinish(); |
+ CheckNoGlError(); |
+ finish_timers.Record(); |
+ |
+ glDeleteTextures(1, &texture_id); |
+ |
+ for (int i = 0; i < 4; ++i) { |
+ std::vector<uint8> pixels_rendered(texture_size.GetArea() * 4); |
+ glReadPixels(texture_size.width() * positions[i].x(), |
+ texture_size.height() * positions[i].y(), texture_size.width(), |
+ texture_size.height(), GL_RGBA, GL_UNSIGNED_BYTE, |
+ &pixels_rendered[0]); |
+ CheckNoGlError(); |
+ ASSERT_EQ(pixels[i].size(), pixels_rendered.size()); |
+ EXPECT_EQ(pixels[i], pixels_rendered); |
+ } |
- RunUploadAndDrawMultipleTimes(size); |
+ bool gpu_timer_errors = gpu_timing_client_->IsAvailable() && |
+ gpu_timing_client_->CheckAndResetTimerErrors(); |
+ if (!gpu_timer_errors) { |
+ upload_and_draw_timers.GetAsMeasurement("upload_and_draw").PrintResult(""); |
+ finish_timers.GetAsMeasurement("finish").PrintResult(""); |
} |
} |