Fifth attempt to land faster rect blur. Remove unnecessary conditionals from the shader.

approved over in https://codereview.chromium.org/331863006/; reuploading
because it had the wrong base url

BUG=skia:2095
R=bsalomon@google.com
TBR=bsalomon

Author: humper@google.com

Review URL: https://codereview.chromium.org/341543005
This commit is contained in:
humper 2014-06-17 13:39:29 -07:00 committed by Commit bot
parent 9323b01e90
commit 4a24cd8ff4
4 changed files with 116 additions and 101 deletions

View File

@ -33,6 +33,19 @@
## epoger will rebaseline by 25 Dec 2013 ## epoger will rebaseline by 25 Dec 2013
#gradtext #gradtext
# reed: bitmapfilters changed (labels) with hide_config CL, just need rebaselines
bitmapfilters
# humper:
# Needs rebaselining after faster GPU blur patch lands
megalooper_0x0
megalooper_1x4
megalooper_4x1
bleed
blurquickreject
blurrects
bigblurs
# reed: https://codereview.chromium.org/190723004/ # reed: https://codereview.chromium.org/190723004/
# This change removes an API that this GM was testing. If/when it lands and sticks, # This change removes an API that this GM was testing. If/when it lands and sticks,
# I will likely just delete the GM. # I will likely just delete the GM.

View File

@ -557,40 +557,38 @@ public:
*/ */
static GrEffectRef* Create(GrContext *context, const SkRect& rect, static GrEffectRef* Create(GrContext *context, const SkRect& rect,
float sigma) { float sigma) {
GrTexture *horizontalScanline = NULL, *verticalScanline = NULL; GrTexture *blurProfileTexture = NULL;
bool createdScanlines = CreateScanlineTextures(context, sigma, int doubleProfileSize = SkScalarCeilToInt(12*sigma);
SkScalarCeilToInt(rect.width()),
SkScalarCeilToInt(rect.height()), if (doubleProfileSize >= rect.width() || doubleProfileSize >= rect.height()) {
&horizontalScanline, &verticalScanline); // if the blur sigma is too large so the gaussian overlaps the whole
SkAutoTUnref<GrTexture> hunref(horizontalScanline), vunref(verticalScanline); // rect in either direction, fall back to CPU path for now.
if (!createdScanlines) {
return NULL; return NULL;
} }
AutoEffectUnref effect(SkNEW_ARGS(GrRectBlurEffect, (rect, sigma,
horizontalScanline, verticalScanline))); bool createdBlurProfileTexture = CreateBlurProfileTexture(context, sigma, &blurProfileTexture);
SkAutoTUnref<GrTexture> hunref(blurProfileTexture);
if (!createdBlurProfileTexture) {
return NULL;
}
AutoEffectUnref effect(SkNEW_ARGS(GrRectBlurEffect, (rect, sigma, blurProfileTexture)));
return CreateEffectRef(effect); return CreateEffectRef(effect);
} }
unsigned int getWidth() const { return fWidth; } const SkRect& getRect() const { return fRect; }
unsigned int getHeight() const { return fHeight; }
float getSigma() const { return fSigma; } float getSigma() const { return fSigma; }
const GrCoordTransform& getTransform() const { return fTransform; }
private: private:
GrRectBlurEffect(const SkRect& rect, float sigma, GrRectBlurEffect(const SkRect& rect, float sigma, GrTexture *blur_profile);
GrTexture *horizontal_scanline, GrTexture *vertical_scanline);
virtual bool onIsEqual(const GrEffect&) const SK_OVERRIDE; virtual bool onIsEqual(const GrEffect&) const SK_OVERRIDE;
static bool CreateScanlineTextures(GrContext *context, float sigma, static bool CreateBlurProfileTexture(GrContext *context, float sigma,
unsigned int width, unsigned int height, GrTexture **blurProfileTexture);
GrTexture **horizontalScanline,
GrTexture **verticalScanline);
unsigned int fWidth, fHeight; SkRect fRect;
float fSigma; float fSigma;
GrTextureAccess fHorizontalScanlineAccess; GrTextureAccess fBlurProfileAccess;
GrTextureAccess fVerticalScanlineAccess;
GrCoordTransform fTransform;
GR_DECLARE_EFFECT_TEST; GR_DECLARE_EFFECT_TEST;
@ -614,16 +612,34 @@ public:
private: private:
typedef GrGLUniformManager::UniformHandle UniformHandle; typedef GrGLUniformManager::UniformHandle UniformHandle;
UniformHandle fWidthUni; UniformHandle fProxyRectUniform;
UniformHandle fHeightUni; UniformHandle fProfileSizeUniform;
typedef GrGLEffect INHERITED; typedef GrGLEffect INHERITED;
}; };
GrGLRectBlurEffect::GrGLRectBlurEffect(const GrBackendEffectFactory& factory, const GrDrawEffect&) GrGLRectBlurEffect::GrGLRectBlurEffect(const GrBackendEffectFactory& factory, const GrDrawEffect&)
: INHERITED(factory) { : INHERITED(factory) {
} }
void OutputRectBlurProfileLookup(GrGLShaderBuilder* builder,
const GrGLShaderBuilder::TextureSampler& sampler,
const char *output,
const char *profileSize, const char *loc,
const char *blurred_width,
const char *sharp_width) {
builder->fsCodeAppendf("\tfloat %s;\n", output);
builder->fsCodeAppendf("\t\t{\n");
builder->fsCodeAppendf("\t\t\tfloat coord = (0.5 * (abs(2.0*%s - %s) - %s))/%s;\n",
loc, blurred_width, sharp_width, profileSize);
builder->fsCodeAppendf("\t\t\t%s = ", output);
builder->fsAppendTextureLookup(sampler, "vec2(coord,0.5)");
builder->fsCodeAppend(".a;\n");
builder->fsCodeAppendf("\t\t}\n");
}
void GrGLRectBlurEffect::emitCode(GrGLShaderBuilder* builder, void GrGLRectBlurEffect::emitCode(GrGLShaderBuilder* builder,
const GrDrawEffect&, const GrDrawEffect&,
EffectKey key, EffectKey key,
@ -632,7 +648,19 @@ void GrGLRectBlurEffect::emitCode(GrGLShaderBuilder* builder,
const TransformedCoordsArray& coords, const TransformedCoordsArray& coords,
const TextureSamplerArray& samplers) { const TextureSamplerArray& samplers) {
SkString texture_coords = builder->ensureFSCoords2D(coords, 0); const char *rectName;
const char *profileSizeName;
fProxyRectUniform = builder->addUniform(GrGLShaderBuilder::kFragment_Visibility,
kVec4f_GrSLType,
"proxyRect",
&rectName);
fProfileSizeUniform = builder->addUniform(GrGLShaderBuilder::kFragment_Visibility,
kFloat_GrSLType,
"profileSize",
&profileSizeName);
const char *fragmentPos = builder->fragmentPosition();
if (inputColor) { if (inputColor) {
builder->fsCodeAppendf("\tvec4 src=%s;\n", inputColor); builder->fsCodeAppendf("\tvec4 src=%s;\n", inputColor);
@ -640,31 +668,38 @@ void GrGLRectBlurEffect::emitCode(GrGLShaderBuilder* builder,
builder->fsCodeAppendf("\tvec4 src=vec4(1)\n;"); builder->fsCodeAppendf("\tvec4 src=vec4(1)\n;");
} }
builder->fsCodeAppendf("\tvec4 horiz = "); builder->fsCodeAppendf("\tvec2 translatedPos = %s.xy - %s.xy;\n", fragmentPos, rectName );
builder->fsAppendTextureLookup( samplers[0], texture_coords.c_str() ); builder->fsCodeAppendf("\tfloat width = %s.z - %s.x;\n", rectName, rectName);
builder->fsCodeAppendf(";\n"); builder->fsCodeAppendf("\tfloat height = %s.w - %s.y;\n", rectName, rectName);
builder->fsCodeAppendf("\tvec4 vert = ");
builder->fsAppendTextureLookup( samplers[1], texture_coords.c_str() );
builder->fsCodeAppendf(";\n");
builder->fsCodeAppendf("\tfloat final = (horiz*vert).r;\n"); builder->fsCodeAppendf("\tvec2 smallDims = vec2(width - %s, height-%s);\n", profileSizeName, profileSizeName);
builder->fsCodeAppendf("\t%s = final*src;\n", outputColor); builder->fsCodeAppendf("\tfloat center = 2.0 * floor(%s/2.0 + .25) - 1.0;\n", profileSizeName);
builder->fsCodeAppendf("\tvec2 wh = smallDims - vec2(center,center);\n");
OutputRectBlurProfileLookup(builder, samplers[0], "horiz_lookup", profileSizeName, "translatedPos.x", "width", "wh.x");
OutputRectBlurProfileLookup(builder, samplers[0], "vert_lookup", profileSizeName, "translatedPos.y", "height", "wh.y");
builder->fsCodeAppendf("\tfloat final = horiz_lookup * vert_lookup;\n");
builder->fsCodeAppendf("\t%s = src * vec4(final);\n", outputColor );
} }
void GrGLRectBlurEffect::setData(const GrGLUniformManager& uman, void GrGLRectBlurEffect::setData(const GrGLUniformManager& uman,
const GrDrawEffect& drawEffect) { const GrDrawEffect& drawEffect) {
const GrRectBlurEffect& rbe = drawEffect.castEffect<GrRectBlurEffect>();
SkRect rect = rbe.getRect();
uman.set4f(fProxyRectUniform, rect.fLeft, rect.fTop, rect.fRight, rect.fBottom);
uman.set1f(fProfileSizeUniform, SkScalarCeilToScalar(6*rbe.getSigma()));
} }
bool GrRectBlurEffect::CreateScanlineTextures(GrContext *context, float sigma, bool GrRectBlurEffect::CreateBlurProfileTexture(GrContext *context, float sigma,
unsigned int width, unsigned int height, GrTexture **blurProfileTexture) {
GrTexture **horizontalScanline,
GrTexture **verticalScanline) {
GrTextureParams params; GrTextureParams params;
GrTextureDesc texDesc; GrTextureDesc texDesc;
unsigned int profile_size = SkScalarFloorToInt(6*sigma); unsigned int profile_size = SkScalarCeilToInt(6*sigma);
texDesc.fWidth = width; texDesc.fWidth = profile_size;
texDesc.fHeight = 1; texDesc.fHeight = 1;
texDesc.fConfig = kAlpha_8_GrPixelConfig; texDesc.fConfig = kAlpha_8_GrPixelConfig;
@ -672,73 +707,38 @@ bool GrRectBlurEffect::CreateScanlineTextures(GrContext *context, float sigma,
GrCacheID::Key key; GrCacheID::Key key;
memset(&key, 0, sizeof(key)); memset(&key, 0, sizeof(key));
key.fData32[0] = profile_size; key.fData32[0] = profile_size;
key.fData32[1] = width; key.fData32[1] = 1;
key.fData32[2] = 1; GrCacheID blurProfileKey(gBlurProfileDomain, key);
GrCacheID horizontalCacheID(gBlurProfileDomain, key);
uint8_t *profile = NULL; uint8_t *profile = NULL;
SkAutoTDeleteArray<uint8_t> ada(NULL); SkAutoTDeleteArray<uint8_t> ada(NULL);
*horizontalScanline = context->findAndRefTexture(texDesc, horizontalCacheID, &params); *blurProfileTexture = context->findAndRefTexture(texDesc, blurProfileKey, &params);
if (NULL == *horizontalScanline) { if (NULL == *blurProfileTexture) {
SkBlurMask::ComputeBlurProfile(sigma, &profile); SkBlurMask::ComputeBlurProfile(sigma, &profile);
ada.reset(profile); ada.reset(profile);
SkAutoTMalloc<uint8_t> horizontalPixels(width); *blurProfileTexture = context->createTexture(&params, texDesc, blurProfileKey,
SkBlurMask::ComputeBlurredScanline(horizontalPixels, profile, width, sigma); profile, 0);
*horizontalScanline = context->createTexture(&params, texDesc, horizontalCacheID, if (NULL == *blurProfileTexture) {
horizontalPixels, 0);
if (NULL == *horizontalScanline) {
return false; return false;
} }
} }
texDesc.fWidth = 1;
texDesc.fHeight = height;
key.fData32[1] = 1;
key.fData32[2] = height;
GrCacheID verticalCacheID(gBlurProfileDomain, key);
*verticalScanline = context->findAndRefTexture(texDesc, verticalCacheID, &params);
if (NULL == *verticalScanline) {
if (NULL == profile) {
SkBlurMask::ComputeBlurProfile(sigma, &profile);
ada.reset(profile);
}
SkAutoTMalloc<uint8_t> verticalPixels(height);
SkBlurMask::ComputeBlurredScanline(verticalPixels, profile, height, sigma);
*verticalScanline = context->createTexture(&params, texDesc, verticalCacheID,
verticalPixels, 0);
if (NULL == *verticalScanline) {
SkSafeSetNull(*horizontalScanline);
return false;
}
}
return true; return true;
} }
GrRectBlurEffect::GrRectBlurEffect(const SkRect& rect, float sigma, GrRectBlurEffect::GrRectBlurEffect(const SkRect& rect, float sigma,
GrTexture *horizontal_scanline, GrTexture *vertical_scanline) GrTexture *blur_profile)
: INHERITED(), : INHERITED(),
fWidth(horizontal_scanline->width()), fRect(rect),
fHeight(vertical_scanline->width()),
fSigma(sigma), fSigma(sigma),
fHorizontalScanlineAccess(horizontal_scanline), fBlurProfileAccess(blur_profile) {
fVerticalScanlineAccess(vertical_scanline) { this->addTextureAccess(&fBlurProfileAccess);
SkMatrix mat; this->setWillReadFragmentPosition();
mat.setRectToRect(rect, SkRect::MakeWH(1,1), SkMatrix::kFill_ScaleToFit);
fTransform.reset(kLocal_GrCoordSet, mat);
this->addTextureAccess(&fHorizontalScanlineAccess);
this->addTextureAccess(&fVerticalScanlineAccess);
this->addCoordTransform(&fTransform);
} }
GrRectBlurEffect::~GrRectBlurEffect() { GrRectBlurEffect::~GrRectBlurEffect() {
@ -750,10 +750,7 @@ const GrBackendEffectFactory& GrRectBlurEffect::getFactory() const {
bool GrRectBlurEffect::onIsEqual(const GrEffect& sBase) const { bool GrRectBlurEffect::onIsEqual(const GrEffect& sBase) const {
const GrRectBlurEffect& s = CastEffect<GrRectBlurEffect>(sBase); const GrRectBlurEffect& s = CastEffect<GrRectBlurEffect>(sBase);
return this->getWidth() == s.getWidth() && return this->getSigma() == s.getSigma() && this->getRect() == s.getRect();
this->getHeight() == s.getHeight() &&
this->getSigma() == s.getSigma() &&
this->getTransform() == s.getTransform();
} }
void GrRectBlurEffect::getConstantColorComponents(GrColor* color, uint32_t* validFlags) const { void GrRectBlurEffect::getConstantColorComponents(GrColor* color, uint32_t* validFlags) const {
@ -793,7 +790,9 @@ bool SkBlurMaskFilterImpl::directFilterMaskGPU(GrContext* context,
SkMatrix ctm = context->getMatrix(); SkMatrix ctm = context->getMatrix();
SkScalar xformedSigma = this->computeXformedSigma(ctm); SkScalar xformedSigma = this->computeXformedSigma(ctm);
rect.outset(3*xformedSigma, 3*xformedSigma);
int pad=SkScalarCeilToInt(6*xformedSigma)/2;
rect.outset(SkIntToScalar(pad), SkIntToScalar(pad));
SkAutoTUnref<GrEffectRef> effect(GrRectBlurEffect::Create( SkAutoTUnref<GrEffectRef> effect(GrRectBlurEffect::Create(
context, rect, xformedSigma)); context, rect, xformedSigma));
@ -806,7 +805,6 @@ bool SkBlurMaskFilterImpl::directFilterMaskGPU(GrContext* context,
return false; return false;
} }
grp->addCoverageEffect(effect); grp->addCoverageEffect(effect);
context->drawRect(*grp, rect); context->drawRect(*grp, rect);

View File

@ -216,7 +216,7 @@ bool GrGLShaderBuilder::genProgram(const GrEffectStage* colorStages[],
if (GrGLProgramDesc::kSecondaryCoverageISA_CoverageOutput == header.fCoverageOutput) { if (GrGLProgramDesc::kSecondaryCoverageISA_CoverageOutput == header.fCoverageOutput) {
// Get (1-A) into coeff // Get (1-A) into coeff
coeff = GrGLSLExpr4::VectorCast(GrGLSLExpr1(1) - inputColor.a()); coeff = GrGLSLExpr4::VectorCast(GrGLSLExpr1(1) - inputColor.a());
} else if (GrGLProgramDesc::kSecondaryCoverageISC_CoverageOutput == } else if (GrGLProgramDesc::kSecondaryCoverageISC_CoverageOutput ==
header.fCoverageOutput){ header.fCoverageOutput){
// Get (1-RGBA) into coeff // Get (1-RGBA) into coeff
coeff = GrGLSLExpr4(1) - inputColor; coeff = GrGLSLExpr4(1) - inputColor;

View File

@ -273,6 +273,8 @@ static void cpu_blur_path(const SkPath& path, SkScalar gaussianSigma,
} }
#if SK_SUPPORT_GPU #if SK_SUPPORT_GPU
#if 0
// temporary disable; see below for explanation
static bool gpu_blur_path(GrContextFactory* factory, const SkPath& path, static bool gpu_blur_path(GrContextFactory* factory, const SkPath& path,
SkScalar gaussianSigma, SkScalar gaussianSigma,
int* result, int resultCount) { int* result, int resultCount) {
@ -298,6 +300,7 @@ static bool gpu_blur_path(GrContextFactory* factory, const SkPath& path,
return true; return true;
} }
#endif #endif
#endif
#if WRITE_CSV #if WRITE_CSV
static void write_as_csv(const char* label, SkScalar scale, int* data, int count) { static void write_as_csv(const char* label, SkScalar scale, int* data, int count) {
@ -343,9 +346,6 @@ static void test_sigma_range(skiatest::Reporter* reporter, GrContextFactory* fac
int rectSpecialCaseResult[kSize]; int rectSpecialCaseResult[kSize];
int generalCaseResult[kSize]; int generalCaseResult[kSize];
#if SK_SUPPORT_GPU
int gpuResult[kSize];
#endif
int groundTruthResult[kSize]; int groundTruthResult[kSize];
int bruteForce1DResult[kSize]; int bruteForce1DResult[kSize];
@ -355,19 +355,23 @@ static void test_sigma_range(skiatest::Reporter* reporter, GrContextFactory* fac
cpu_blur_path(rectPath, sigma, rectSpecialCaseResult, kSize); cpu_blur_path(rectPath, sigma, rectSpecialCaseResult, kSize);
cpu_blur_path(polyPath, sigma, generalCaseResult, kSize); cpu_blur_path(polyPath, sigma, generalCaseResult, kSize);
#if SK_SUPPORT_GPU
bool haveGPUResult = gpu_blur_path(factory, rectPath, sigma, gpuResult, kSize);
#endif
ground_truth_2d(100, 100, sigma, groundTruthResult, kSize); ground_truth_2d(100, 100, sigma, groundTruthResult, kSize);
brute_force_1d(-50.0f, 50.0f, sigma, bruteForce1DResult, kSize); brute_force_1d(-50.0f, 50.0f, sigma, bruteForce1DResult, kSize);
REPORTER_ASSERT(reporter, match(rectSpecialCaseResult, bruteForce1DResult, kSize, 5)); REPORTER_ASSERT(reporter, match(rectSpecialCaseResult, bruteForce1DResult, kSize, 5));
REPORTER_ASSERT(reporter, match(generalCaseResult, bruteForce1DResult, kSize, 15)); REPORTER_ASSERT(reporter, match(generalCaseResult, bruteForce1DResult, kSize, 15));
#if SK_SUPPORT_GPU #if SK_SUPPORT_GPU
#if 0
int gpuResult[kSize];
bool haveGPUResult = gpu_blur_path(factory, rectPath, sigma, gpuResult, kSize);
// Disabling this test for now -- I don't think it's a legit comparison.
// Will continue to investigate this.
if (haveGPUResult) { if (haveGPUResult) {
// 1 works everywhere but: Ubuntu13 & Nexus4 // 1 works everywhere but: Ubuntu13 & Nexus4
REPORTER_ASSERT(reporter, match(gpuResult, bruteForce1DResult, kSize, 10)); REPORTER_ASSERT(reporter, match(gpuResult, bruteForce1DResult, kSize, 10));
} }
#endif
#endif #endif
REPORTER_ASSERT(reporter, match(groundTruthResult, bruteForce1DResult, kSize, 1)); REPORTER_ASSERT(reporter, match(groundTruthResult, bruteForce1DResult, kSize, 1));