Index: src/gpu/effects/GrConvolutionEffect.cpp |
diff --git a/src/gpu/effects/GrConvolutionEffect.cpp b/src/gpu/effects/GrConvolutionEffect.cpp |
index 72640824d2591f4b60e02186aab5d0add0f1d161..a39171818b35e4ace0a618ec80ab97be327a1d30 100644 |
--- a/src/gpu/effects/GrConvolutionEffect.cpp |
+++ b/src/gpu/effects/GrConvolutionEffect.cpp |
@@ -13,9 +13,73 @@ |
// For brevity |
typedef GrGLProgramDataManager::UniformHandle UniformHandle; |
+/** |
+ * Base class with shared functionality for GrGLBoundedConvolutionEffect and |
+ * GrGLBilerpConvolutionEffect. |
+ */ |
class GrGLConvolutionEffect : public GrGLFragmentProcessor { |
public: |
GrGLConvolutionEffect(const GrProcessor&); |
+ static inline void GenKey(const GrProcessor&, const GrGLSLCaps&, GrProcessorKeyBuilder*); |
+ |
+protected: |
+ int radius() const { return fRadius; } |
+ int width() const { return Gr1DKernelEffect::WidthFromRadius(fRadius); } |
+ Gr1DKernelEffect::Direction direction() const { return fDirection; } |
+ void getImageIncrement(const GrConvolutionEffect&, float (*)[2]) const; |
+ |
+private: |
+ int fRadius; |
+ Gr1DKernelEffect::Direction fDirection; |
+ |
+ typedef GrGLFragmentProcessor INHERITED; |
+}; |
+ |
+GrGLConvolutionEffect::GrGLConvolutionEffect(const GrProcessor& processor) { |
+ const GrConvolutionEffect& c = processor.cast<GrConvolutionEffect>(); |
+ fRadius = c.radius(); |
+ fDirection = c.direction(); |
+} |
+ |
+void GrGLConvolutionEffect::GenKey(const GrProcessor& processor, |
+ const GrGLSLCaps&, |
+ GrProcessorKeyBuilder* b) { |
+ const GrConvolutionEffect& conv = processor.cast<GrConvolutionEffect>(); |
+ uint32_t key = conv.radius(); |
+ key <<= 2; |
+ if (conv.useBounds()) { |
+ key |= 0x2; |
+ key |= GrConvolutionEffect::kY_Direction == conv.direction() ? 0x1 : 0x0; |
+ } |
+ b->add32(key); |
+} |
+ |
+void GrGLConvolutionEffect::getImageIncrement(const GrConvolutionEffect& conv, |
+ float (*imageIncrement)[2]) const { |
+ GrTexture& texture = *conv.texture(0); |
+ (*imageIncrement)[0] = (*imageIncrement)[1] = 0; |
+ float ySign = texture.origin() != kTopLeft_GrSurfaceOrigin ? 1.0f : -1.0f; |
+ switch (conv.direction()) { |
+ case Gr1DKernelEffect::kX_Direction: |
+ (*imageIncrement)[0] = 1.0f / texture.width(); |
+ break; |
+ case Gr1DKernelEffect::kY_Direction: |
+ (*imageIncrement)[1] = ySign / texture.height(); |
+ break; |
+ default: |
+ SkFAIL("Unknown filter direction."); |
+ } |
+} |
+ |
+/////////////////////////////////////////////////////////////////////////////// |
+ |
+/** |
+ * Applies a convolution effect which restricts samples to the provided bounds |
+ * using shader logic. |
+ */ |
+class GrGLBoundedConvolutionEffect : public GrGLConvolutionEffect { |
+public: |
+ GrGLBoundedConvolutionEffect(const GrProcessor& processor) : INHERITED(processor) {} |
virtual void emitCode(GrGLFPBuilder*, |
const GrFragmentProcessor&, |
@@ -26,47 +90,29 @@ public: |
void setData(const GrGLProgramDataManager& pdman, const GrProcessor&) override; |
- static inline void GenKey(const GrProcessor&, const GrGLSLCaps&, GrProcessorKeyBuilder*); |
- |
private: |
- int width() const { return Gr1DKernelEffect::WidthFromRadius(fRadius); } |
- bool useBounds() const { return fUseBounds; } |
- Gr1DKernelEffect::Direction direction() const { return fDirection; } |
- |
- int fRadius; |
- bool fUseBounds; |
- Gr1DKernelEffect::Direction fDirection; |
UniformHandle fKernelUni; |
UniformHandle fImageIncrementUni; |
UniformHandle fBoundsUni; |
- typedef GrGLFragmentProcessor INHERITED; |
+ typedef GrGLConvolutionEffect INHERITED; |
}; |
-GrGLConvolutionEffect::GrGLConvolutionEffect(const GrProcessor& processor) { |
- const GrConvolutionEffect& c = processor.cast<GrConvolutionEffect>(); |
- fRadius = c.radius(); |
- fUseBounds = c.useBounds(); |
- fDirection = c.direction(); |
-} |
+void GrGLBoundedConvolutionEffect::emitCode(GrGLFPBuilder* builder, |
+ const GrFragmentProcessor& processor, |
+ const char* outputColor, |
+ const char* inputColor, |
+ const TransformedCoordsArray& coords, |
+ const TextureSamplerArray& samplers) { |
+ fImageIncrementUni = |
+ builder->addUniform(GrGLProgramBuilder::kFragment_Visibility, kVec2f_GrSLType, |
+ kDefault_GrSLPrecision, "ImageIncrement"); |
-void GrGLConvolutionEffect::emitCode(GrGLFPBuilder* builder, |
- const GrFragmentProcessor&, |
- const char* outputColor, |
- const char* inputColor, |
- const TransformedCoordsArray& coords, |
- const TextureSamplerArray& samplers) { |
- fImageIncrementUni = builder->addUniform(GrGLProgramBuilder::kFragment_Visibility, |
- kVec2f_GrSLType, kDefault_GrSLPrecision, |
- "ImageIncrement"); |
- if (this->useBounds()) { |
- fBoundsUni = builder->addUniform(GrGLProgramBuilder::kFragment_Visibility, |
- kVec2f_GrSLType, kDefault_GrSLPrecision, |
- "Bounds"); |
- } |
- fKernelUni = builder->addUniformArray(GrGLProgramBuilder::kFragment_Visibility, |
- kFloat_GrSLType, kDefault_GrSLPrecision, |
- "Kernel", this->width()); |
+ fBoundsUni = builder->addUniform(GrGLProgramBuilder::kFragment_Visibility, kVec2f_GrSLType, |
+ kDefault_GrSLPrecision, "Bounds"); |
+ |
+ fKernelUni = builder->addUniformArray(GrGLProgramBuilder::kFragment_Visibility, kFloat_GrSLType, |
+ kDefault_GrSLPrecision, "Kernel", this->width()); |
GrGLFragmentBuilder* fsBuilder = builder->getFragmentShaderBuilder(); |
SkString coords2D = fsBuilder->ensureFSCoords2D(coords, 0); |
@@ -77,7 +123,8 @@ void GrGLConvolutionEffect::emitCode(GrGLFPBuilder* builder, |
const GrGLShaderVar& kernel = builder->getUniformVariable(fKernelUni); |
const char* imgInc = builder->getUniformCStr(fImageIncrementUni); |
- fsBuilder->codeAppendf("\t\tvec2 coord = %s - %d.0 * %s;\n", coords2D.c_str(), fRadius, imgInc); |
+ fsBuilder->codeAppendf("\t\tvec2 coord = %s - %d.0 * %s;\n", coords2D.c_str(), this->radius(), |
+ imgInc); |
// Manually unroll loop because some drivers don't; yields 20-30% speedup. |
for (int i = 0; i < width; i++) { |
@@ -87,12 +134,10 @@ void GrGLConvolutionEffect::emitCode(GrGLFPBuilder* builder, |
kernel.appendArrayAccess(index.c_str(), &kernelIndex); |
fsBuilder->codeAppendf("\t\t%s += ", outputColor); |
fsBuilder->appendTextureLookup(samplers[0], "coord"); |
- if (this->useBounds()) { |
- const char* bounds = builder->getUniformCStr(fBoundsUni); |
- const char* component = this->direction() == Gr1DKernelEffect::kY_Direction ? "y" : "x"; |
- fsBuilder->codeAppendf(" * float(coord.%s >= %s.x && coord.%s <= %s.y)", |
- component, bounds, component, bounds); |
- } |
+ const char* bounds = builder->getUniformCStr(fBoundsUni); |
+ const char* component = this->direction() == Gr1DKernelEffect::kY_Direction ? "y" : "x"; |
+ fsBuilder->codeAppendf(" * float(coord.%s >= %s.x && coord.%s <= %s.y)", component, bounds, |
+ component, bounds); |
fsBuilder->codeAppendf(" * %s;\n", kernelIndex.c_str()); |
fsBuilder->codeAppendf("\t\tcoord += %s;\n", imgInc); |
} |
@@ -102,47 +147,155 @@ void GrGLConvolutionEffect::emitCode(GrGLFPBuilder* builder, |
fsBuilder->codeAppend(modulate.c_str()); |
} |
-void GrGLConvolutionEffect::setData(const GrGLProgramDataManager& pdman, |
- const GrProcessor& processor) { |
+void GrGLBoundedConvolutionEffect::setData(const GrGLProgramDataManager& pdman, |
+ const GrProcessor& processor) { |
const GrConvolutionEffect& conv = processor.cast<GrConvolutionEffect>(); |
- GrTexture& texture = *conv.texture(0); |
+ |
// the code we generated was for a specific kernel radius |
- SkASSERT(conv.radius() == fRadius); |
- float imageIncrement[2] = { 0 }; |
- float ySign = texture.origin() != kTopLeft_GrSurfaceOrigin ? 1.0f : -1.0f; |
- switch (conv.direction()) { |
- case Gr1DKernelEffect::kX_Direction: |
- imageIncrement[0] = 1.0f / texture.width(); |
- break; |
- case Gr1DKernelEffect::kY_Direction: |
- imageIncrement[1] = ySign / texture.height(); |
- break; |
- default: |
- SkFAIL("Unknown filter direction."); |
- } |
+ SkASSERT(conv.radius() == this->radius()); |
+ |
+ // the code we generated was for a specific bounding mode. |
+ SkASSERT(conv.useBounds() == true); |
+ |
+ GrTexture& texture = *conv.texture(0); |
+ float imageIncrement[2]; |
+ getImageIncrement(conv, &imageIncrement); |
pdman.set2fv(fImageIncrementUni, 1, imageIncrement); |
- if (conv.useBounds()) { |
- const float* bounds = conv.bounds(); |
- if (Gr1DKernelEffect::kY_Direction == conv.direction() && |
- texture.origin() != kTopLeft_GrSurfaceOrigin) { |
- pdman.set2f(fBoundsUni, 1.0f - bounds[1], 1.0f - bounds[0]); |
- } else { |
- pdman.set2f(fBoundsUni, bounds[0], bounds[1]); |
- } |
+ const float* bounds = conv.bounds(); |
+ if (Gr1DKernelEffect::kY_Direction == conv.direction() && |
+ texture.origin() != kTopLeft_GrSurfaceOrigin) { |
+ pdman.set2f(fBoundsUni, 1.0f - bounds[1], 1.0f - bounds[0]); |
+ } else { |
+ pdman.set2f(fBoundsUni, bounds[0], bounds[1]); |
} |
pdman.set1fv(fKernelUni, this->width(), conv.kernel()); |
} |
-void GrGLConvolutionEffect::GenKey(const GrProcessor& processor, const GrGLSLCaps&, |
- GrProcessorKeyBuilder* b) { |
+/////////////////////////////////////////////////////////////////////////////// |
+ |
+/** |
+ * Applies a convolution effect which applies the convolution using a bilinear |
+ * sampling optimization to use half as many samples. |
+ */ |
+class GrGLBilerpConvolutionEffect : public GrGLConvolutionEffect { |
Stephen White
2015/06/26 21:28:31
<bikeshed> is this really a bilinear fetch? Or ess
ericrk
2015/06/29 17:33:21
yup - that's better :D
|
+public: |
+ GrGLBilerpConvolutionEffect(const GrProcessor& processor) : INHERITED(processor) {} |
+ |
+ virtual void emitCode(GrGLFPBuilder*, |
+ const GrFragmentProcessor&, |
+ const char* outputColor, |
+ const char* inputColor, |
+ const TransformedCoordsArray&, |
+ const TextureSamplerArray&) override; |
+ |
+ void setData(const GrGLProgramDataManager& pdman, const GrProcessor&) override; |
+ |
+private: |
+ int bilerpSampleCount() const; |
+ |
+ // Bounded uniforms |
+ UniformHandle fSampleWeightUni; |
+ UniformHandle fSampleOffsetUni; |
+ |
+ typedef GrGLConvolutionEffect INHERITED; |
+}; |
+ |
+void GrGLBilerpConvolutionEffect::emitCode(GrGLFPBuilder* builder, |
+ const GrFragmentProcessor& processor, |
+ const char* outputColor, |
+ const char* inputColor, |
+ const TransformedCoordsArray& coords, |
+ const TextureSamplerArray& samplers) { |
+ int sampleCount = bilerpSampleCount(); |
+ |
+ fSampleOffsetUni = |
Stephen White
2015/06/26 21:28:31
How many uniform values does this add up to? You m
ericrk
2015/06/29 17:33:21
I think we're safe (assuming we keep the limit of
Stephen White
2015/06/29 19:04:06
Yep; makes sense. Thanks!
|
+ builder->addUniformArray(GrGLProgramBuilder::kFragment_Visibility, kVec2f_GrSLType, |
+ kDefault_GrSLPrecision, "SampleOffset", sampleCount); |
+ fSampleWeightUni = |
+ builder->addUniformArray(GrGLProgramBuilder::kFragment_Visibility, kFloat_GrSLType, |
+ kDefault_GrSLPrecision, "SampleWeight", sampleCount); |
+ |
+ GrGLFragmentBuilder* fsBuilder = builder->getFragmentShaderBuilder(); |
+ SkString coords2D = fsBuilder->ensureFSCoords2D(coords, 0); |
+ |
+ fsBuilder->codeAppendf("\t\t%s = vec4(0, 0, 0, 0);\n", outputColor); |
bsalomon
2015/06/26 21:07:33
You don't really need the \t's anymore (we now "pr
ericrk
2015/06/26 21:28:22
removed the \t\ts throughout the file
|
+ |
+ const GrGLShaderVar& kernel = builder->getUniformVariable(fSampleWeightUni); |
+ const GrGLShaderVar& imgInc = builder->getUniformVariable(fSampleOffsetUni); |
+ |
+ fsBuilder->codeAppendf("\t\tvec2 coord; \n"); |
+ |
+ // Manually unroll loop because some drivers don't; yields 20-30% speedup. |
+ for (int i = 0; i < sampleCount; i++) { |
+ SkString index; |
+ SkString weightIndex; |
+ SkString offsetIndex; |
+ index.appendS32(i); |
+ kernel.appendArrayAccess(index.c_str(), &weightIndex); |
+ imgInc.appendArrayAccess(index.c_str(), &offsetIndex); |
+ fsBuilder->codeAppendf("\t\tcoord = %s + %s;\n", coords2D.c_str(), offsetIndex.c_str()); |
+ fsBuilder->codeAppendf("\t\t%s += ", outputColor); |
+ fsBuilder->appendTextureLookup(samplers[0], "coord"); |
+ fsBuilder->codeAppendf(" * %s;\n", weightIndex.c_str()); |
+ } |
+ |
+ SkString modulate; |
+ GrGLSLMulVarBy4f(&modulate, outputColor, inputColor); |
+ fsBuilder->codeAppend(modulate.c_str()); |
+} |
+ |
+void GrGLBilerpConvolutionEffect::setData(const GrGLProgramDataManager& pdman, |
+ const GrProcessor& processor) { |
const GrConvolutionEffect& conv = processor.cast<GrConvolutionEffect>(); |
- uint32_t key = conv.radius(); |
- key <<= 2; |
- if (conv.useBounds()) { |
- key |= 0x2; |
- key |= GrConvolutionEffect::kY_Direction == conv.direction() ? 0x1 : 0x0; |
+ |
+ // the code we generated was for a specific kernel radius |
+ SkASSERT(conv.radius() == this->radius()); |
+ |
+ // the code we generated was for a specific bounding mode. |
+ SkASSERT(conv.useBounds() == false); |
bsalomon
2015/06/26 21:07:34
!conv.useBounds()?
ericrk
2015/06/26 21:28:22
yup
|
+ |
+ int sampleCount = bilerpSampleCount(); |
+ SkAutoTArray<float> imageIncrements(sampleCount * 2); // X and Y floats per sample. |
+ SkAutoTArray<float> kernel(sampleCount); |
+ |
+ float baseImageIncrement[2]; |
+ getImageIncrement(conv, &baseImageIncrement); |
+ |
+ for (int i = 0; i < sampleCount; i++) { |
+ int sampleIndex1 = i * 2; |
+ int sampleIndex2 = sampleIndex1 + 1; |
+ |
+ // If we have an odd number of samples in our filter, the last sample won't use |
+ // the bilinear optimization (it will be pixel aligned). |
+ if (sampleIndex2 >= this->width()) { |
+ sampleIndex2 = sampleIndex1; |
+ } |
+ |
+ float kernelWeight1 = conv.kernel()[sampleIndex1]; |
+ float kernelWeight2 = conv.kernel()[sampleIndex2]; |
+ |
+ float totalKernalWeight = |
Stephen White
2015/06/26 21:28:31
Nit: kernal -> kernel?
|
+ (sampleIndex1 == sampleIndex2) ? kernelWeight1 : (kernelWeight1 + kernelWeight2); |
+ |
+ float sampleRatio = |
+ (sampleIndex1 == sampleIndex2) ? 0 : kernelWeight2 / (kernelWeight1 + kernelWeight2); |
+ |
+ imageIncrements[i * 2] = (-this->radius() + i * 2 + sampleRatio) * baseImageIncrement[0]; |
+ imageIncrements[i * 2 + 1] = |
+ (-this->radius() + i * 2 + sampleRatio) * baseImageIncrement[1]; |
+ |
+ kernel[i] = totalKernalWeight; |
} |
- b->add32(key); |
+ pdman.set2fv(fSampleOffsetUni, sampleCount, imageIncrements.get()); |
+ pdman.set1fv(fSampleWeightUni, sampleCount, kernel.get()); |
+} |
+ |
+int GrGLBilerpConvolutionEffect::bilerpSampleCount() const { |
+ // We use a bilinear optimization to only sample once for each two pixel aligned |
+ // samples in the kernel. If we have an odd number of samples, we will have to |
+ // skip this optimization for the last sample. Because of this we always round |
+ // up our sample count (by adding 1 before dividing). |
+ return (this->width() + 1) / 2; |
} |
/////////////////////////////////////////////////////////////////////////////// |
@@ -153,7 +306,12 @@ GrConvolutionEffect::GrConvolutionEffect(GrTexture* texture, |
const float* kernel, |
bool useBounds, |
float bounds[2]) |
- : Gr1DKernelEffect(texture, direction, radius), fUseBounds(useBounds) { |
+ : Gr1DKernelEffect(texture, |
+ direction, |
+ radius, |
+ useBounds ? GrTextureParams::FilterMode::kNone_FilterMode |
+ : GrTextureParams::FilterMode::kBilerp_FilterMode) |
+ , fUseBounds(useBounds) { |
this->initClassID<GrConvolutionEffect>(); |
SkASSERT(radius <= kMaxKernelRadius); |
SkASSERT(kernel); |
@@ -170,7 +328,12 @@ GrConvolutionEffect::GrConvolutionEffect(GrTexture* texture, |
float gaussianSigma, |
bool useBounds, |
float bounds[2]) |
- : Gr1DKernelEffect(texture, direction, radius), fUseBounds(useBounds) { |
+ : Gr1DKernelEffect(texture, |
+ direction, |
+ radius, |
+ useBounds ? GrTextureParams::FilterMode::kNone_FilterMode |
+ : GrTextureParams::FilterMode::kBilerp_FilterMode) |
+ , fUseBounds(useBounds) { |
this->initClassID<GrConvolutionEffect>(); |
SkASSERT(radius <= kMaxKernelRadius); |
int width = this->width(); |
@@ -201,7 +364,14 @@ void GrConvolutionEffect::getGLProcessorKey(const GrGLSLCaps& caps, |
} |
GrGLFragmentProcessor* GrConvolutionEffect::createGLInstance() const { |
- return SkNEW_ARGS(GrGLConvolutionEffect, (*this)); |
+ // We support a bilinear optimization which (when feasible) uses half the number |
+ // of samples to apply the kernel. This is not always applicable, as the |
+ // bilinear sampling optimization does not support bounded sampling. |
+ if (this->useBounds()) { |
+ return SkNEW_ARGS(GrGLBoundedConvolutionEffect, (*this)); |
+ } else { |
+ return SkNEW_ARGS(GrGLBilerpConvolutionEffect, (*this)); |
+ } |
} |
bool GrConvolutionEffect::onIsEqual(const GrFragmentProcessor& sBase) const { |