/*
 * Copyright 2011 The Android Open Source Project
 *
 * Use of this source code is governed by a BSD-style license that can be
 * found in the LICENSE file.
 */

#include "SkBitmap.h"
#include "SkBlurImageFilter.h"
#include "SkColorPriv.h"
#include "SkFlattenableBuffers.h"
#include "SkGpuBlurUtils.h"
#include "SkBlurImage_opts.h"
#if SK_SUPPORT_GPU
#include "GrContext.h"
#include "SkImageFilterUtils.h"
#endif

/**
 *  Unflattening constructor. Reads the X sigma and then the Y sigma (the same
 *  order flatten() writes them) and hands the buffer's validate() a condition
 *  requiring both to be finite and non-negative.
 */
SkBlurImageFilter::SkBlurImageFilter(SkFlattenableReadBuffer& buffer)
  : INHERITED(1, buffer) {
    fSigma.fWidth = buffer.readScalar();
    fSigma.fHeight = buffer.readScalar();
    buffer.validate(SkScalarIsFinite(fSigma.fWidth) &&
                    SkScalarIsFinite(fSigma.fHeight) &&
                    (fSigma.fWidth >= 0) &&
                    (fSigma.fHeight >= 0));
}

/**
 *  @param sigmaX    blur sigma along X; asserted non-negative in debug builds.
 *  @param sigmaY    blur sigma along Y; asserted non-negative in debug builds.
 *  @param input     forwarded to the base class.
 *  @param cropRect  forwarded to the base class.
 */
SkBlurImageFilter::SkBlurImageFilter(SkScalar sigmaX,
                                     SkScalar sigmaY,
                                     SkImageFilter* input,
                                     const CropRect* cropRect)
    : INHERITED(input, cropRect), fSigma(SkSize::Make(sigmaX, sigmaY)) {
    SkASSERT(sigmaX >= 0 && sigmaY >= 0);
}

/**
 *  Writes the base-class state followed by the X and Y sigma, in the order the
 *  unflattening constructor reads them back.
 */
void SkBlurImageFilter::flatten(SkFlattenableWriteBuffer& buffer) const {
    this->INHERITED::flatten(buffer);
    buffer.writeScalar(fSigma.fWidth);
    buffer.writeScalar(fSigma.fHeight);
}

/** Axis selector used as a compile-time parameter of boxBlur(). */
enum BlurDirection {
    kX, kY
};

/**
 *
 * In order to make memory accesses cache-friendly, we reorder the passes to
 * use contiguous memory reads wherever possible.
 *
 * For example, the 6 passes of the X-and-Y blur case are rewritten as
 * follows. Instead of 3 passes in X and 3 passes in Y, we perform
 * 2 passes in X, 1 pass in X transposed to Y on write, 2 passes in X,
 * then 1 pass in X transposed to Y on write.
 *
 * +----+       +----+       +----+        +---+       +---+       +---+        +----+
 * + AB + ----> | AB | ----> | AB | -----> | A | ----> | A | ----> | A | -----> | AB |
 * +----+ blurX +----+ blurX +----+ blurXY | B | blurX | B | blurX | B | blurXY +----+
 *                                         +---+       +---+       +---+
 *
 * In this way, two of the y-blurs become x-blurs applied to transposed
 * images, and all memory reads are contiguous.
 */

/**
 *  One box-filter pass over a 32-bit premultiplied image using a running
 *  per-channel sum.
 *
 *  The template parameters choose how the "inner" (x) loop steps through
 *  memory: with kX it advances one pixel at a time, with kY it advances one
 *  row at a time (srcStride pixels when reading, 'height' pixels when
 *  writing). Using different directions for source and destination therefore
 *  transposes the image while blurring.
 *
 *  @param src          first source pixel.
 *  @param srcStride    distance, in pixels, between consecutive source rows.
 *  @param dst          first destination pixel. The destination is addressed
 *                      as tightly packed (row pitch of 'width' pixels, or
 *                      'height' pixels when written transposed).
 *  @param kernelSize   box width used to normalise the sum; must be > 0.
 *  @param leftOffset   number of pixels the window extends before the output
 *                      pixel.
 *  @param rightOffset  number of pixels the window extends after the output
 *                      pixel.
 *  @param width        length of the inner loop (pixels per blurred line).
 *  @param height       number of lines to blur.
 *
 *  Samples that would fall outside [0, width) contribute nothing to the sum,
 *  but the divisor stays kernelSize, so lines fade towards zero at their ends.
 */
template<BlurDirection srcDirection, BlurDirection dstDirection>
static void boxBlur(const SkPMColor* src, int srcStride, SkPMColor* dst, int kernelSize,
                    int leftOffset, int rightOffset, int width, int height)
{
    SkASSERT(kernelSize > 0);
    int rightBorder = SkMin32(rightOffset + 1, width);
    int srcStrideX = srcDirection == kX ? 1 : srcStride;
    int dstStrideX = dstDirection == kX ? 1 : height;
    int srcStrideY = srcDirection == kX ? srcStride : 1;
    int dstStrideY = dstDirection == kX ? width : 1;
    // Division by kernelSize is done as a multiply by a 8.24 fixed-point
    // reciprocal; 'half' rounds to nearest before the >> 24.
    uint32_t scale = (1 << 24) / kernelSize;
    uint32_t half = 1 << 23;
    for (int y = 0; y < height; ++y) {
        int sumA = 0, sumR = 0, sumG = 0, sumB = 0;
        // Prime the running sums with the part of the first window that lies
        // inside the line.
        const SkPMColor* p = src;
        for (int i = 0; i < rightBorder; ++i) {
            sumA += SkGetPackedA32(*p);
            sumR += SkGetPackedR32(*p);
            sumG += SkGetPackedG32(*p);
            sumB += SkGetPackedB32(*p);
            p += srcStrideX;
        }

        const SkPMColor* sptr = src;
        SkPMColor* dptr = dst;
        for (int x = 0; x < width; ++x) {
            *dptr = SkPackARGB32((sumA * scale + half) >> 24,
                                 (sumR * scale + half) >> 24,
                                 (sumG * scale + half) >> 24,
                                 (sumB * scale + half) >> 24);
            // Slide the window: drop the pixel leaving on the left...
            if (x >= leftOffset) {
                SkPMColor l = *(sptr - leftOffset * srcStrideX);
                sumA -= SkGetPackedA32(l);
                sumR -= SkGetPackedR32(l);
                sumG -= SkGetPackedG32(l);
                sumB -= SkGetPackedB32(l);
            }
            // ...and add the pixel entering on the right, if there is one.
            if (x + rightOffset + 1 < width) {
                SkPMColor r = *(sptr + (rightOffset + 1) * srcStrideX);
                sumA += SkGetPackedA32(r);
                sumR += SkGetPackedR32(r);
                sumG += SkGetPackedG32(r);
                sumB += SkGetPackedB32(r);
            }
            sptr += srcStrideX;
            // Only strided (column-wise) reads are prefetched.
            if (srcDirection == kY) {
                SK_PREFETCH(sptr + (rightOffset + 1) * srcStrideX);
            }
            dptr += dstStrideX;
        }
        src += srcStrideY;
        dst += dstStrideY;
    }
}

/**
 *  Derives the parameters of the three box passes used for one axis.
 *
 *  d = floor(s * 3 * sqrt(2 * pi) / 4 + 0.5) is the box width. (This appears
 *  to be the box-blur approximation given for feGaussianBlur in the SVG
 *  filter specification.)
 *
 *  @param s            sigma for this axis.
 *  @param kernelSize   receives d, the width of the first two passes.
 *  @param kernelSize3  receives the width of the third pass: d when d is odd,
 *                      d + 1 when d is even.
 *  @param lowOffset    receives (d - 1) / 2 when d is odd, d / 2 - 1 when even.
 *  @param highOffset   receives (d - 1) / 2 when d is odd, d / 2 when even.
 */
static void getBox3Params(SkScalar s, int *kernelSize, int* kernelSize3, int *lowOffset,
                          int *highOffset)
{
    float pi = SkScalarToFloat(SK_ScalarPI);
    int d = static_cast<int>(floorf(SkScalarToFloat(s) * 3.0f * sqrtf(2.0f * pi) / 4.0f + 0.5f));
    *kernelSize = d;
    if (d % 2 == 1) {
        *lowOffset = *highOffset = (d - 1) / 2;
        *kernelSize3 = d;
    } else {
        *highOffset = d / 2;
        *lowOffset = *highOffset - 1;
        *kernelSize3 = d + 1;
    }
}

/**
 *  CPU implementation: blurs the (optionally pre-filtered and cropped) source
 *  with three box passes per axis.
 *
 *  Returns false when the input filter fails, the source is not 8888, its
 *  pixels are unavailable, the crop rect rejects the bounds, an allocation
 *  fails, or a computed kernel size is negative. On the blurring paths,
 *  'offset' is advanced by the top-left of the cropped source bounds.
 */
bool SkBlurImageFilter::onFilterImage(Proxy* proxy,
                                      const SkBitmap& source, const SkMatrix& ctm,
                                      SkBitmap* dst, SkIPoint* offset) {
    SkBitmap src = source;
    if (getInput(0) && !getInput(0)->filterImage(proxy, source, ctm, &src, offset)) {
        return false;
    }

    if (src.config() != SkBitmap::kARGB_8888_Config) {
        return false;
    }

    SkAutoLockPixels alp(src);
    if (!src.getPixels()) {
        return false;
    }

    SkIRect srcBounds, dstBounds;
    src.getBounds(&srcBounds);
    if (!this->applyCropRect(&srcBounds, ctm)) {
        return false;
    }

    dst->setConfig(src.config(), srcBounds.width(), srcBounds.height());
    dst->getBounds(&dstBounds);
    dst->allocPixels();
    if (!dst->getPixels()) {
        return false;
    }

    int kernelSizeX, kernelSizeX3, lowOffsetX, highOffsetX;
    int kernelSizeY, kernelSizeY3, lowOffsetY, highOffsetY;
    getBox3Params(fSigma.width(), &kernelSizeX, &kernelSizeX3, &lowOffsetX, &highOffsetX);
    getBox3Params(fSigma.height(), &kernelSizeY, &kernelSizeY3, &lowOffsetY, &highOffsetY);

    if (kernelSizeX < 0 || kernelSizeY < 0) {
        return false;
    }

    if (kernelSizeX == 0 && kernelSizeY == 0) {
        // Nothing to blur: hand back a copy of the source, and report failure
        // if the copy could not be made instead of claiming success.
        // NOTE(review): this path copies the whole of src and leaves 'offset'
        // untouched, i.e. the crop rect is not applied here -- confirm intent.
        return src.copyTo(dst, dst->config());
    }

    SkBitmap temp;
    temp.setConfig(dst->config(), dst->width(), dst->height());
    if (!temp.allocPixels()) {
        return false;
    }

    const SkPMColor* s = src.getAddr32(srcBounds.left(), srcBounds.top());
    SkPMColor* t = temp.getAddr32(0, 0);
    SkPMColor* d = dst->getAddr32(0, 0);
    int w = dstBounds.width(), h = dstBounds.height();
    int sw = src.rowBytesAsPixels();
    SkBoxBlurProc boxBlurX, boxBlurY, boxBlurXY, boxBlurYX;
    // Fall back to the portable template when no platform-specific procs are
    // available. The suffix names the read direction, then the write direction.
    if (!SkBoxBlurGetPlatformProcs(&boxBlurX, &boxBlurY, &boxBlurXY, &boxBlurYX)) {
        boxBlurX = boxBlur<kX, kX>;
        boxBlurY = boxBlur<kY, kY>;
        boxBlurXY = boxBlur<kX, kY>;
        boxBlurYX = boxBlur<kY, kX>;
    }

    if (kernelSizeX > 0 && kernelSizeY > 0) {
        // Three X passes (the last one transposing), then three passes on the
        // transposed image (the last one transposing back into dst).
        boxBlurX(s,  sw, t, kernelSizeX,  lowOffsetX,  highOffsetX, w, h);
        boxBlurX(t,  w,  d, kernelSizeX,  highOffsetX, lowOffsetX,  w, h);
        boxBlurXY(d, w,  t, kernelSizeX3, highOffsetX, highOffsetX, w, h);
        boxBlurX(t,  h,  d, kernelSizeY,  lowOffsetY,  highOffsetY, h, w);
        boxBlurX(d,  h,  t, kernelSizeY,  highOffsetY, lowOffsetY,  h, w);
        boxBlurXY(t, h,  d, kernelSizeY3, highOffsetY, highOffsetY, h, w);
    } else if (kernelSizeX > 0) {
        boxBlurX(s,  sw, d, kernelSizeX,  lowOffsetX,  highOffsetX, w, h);
        boxBlurX(d,  w,  t, kernelSizeX,  highOffsetX, lowOffsetX,  w, h);
        boxBlurX(t,  w,  d, kernelSizeX3, highOffsetX, highOffsetX, w, h);
    } else if (kernelSizeY > 0) {
        // Transpose on the first read so the remaining passes run along
        // contiguous memory, then transpose back on the final write.
        boxBlurYX(s, sw, d, kernelSizeY,  lowOffsetY,  highOffsetY, h, w);
        boxBlurX(d,  h,  t, kernelSizeY,  highOffsetY, lowOffsetY,  h, w);
        boxBlurXY(t, h,  d, kernelSizeY3, highOffsetY, highOffsetY, h, w);
    }
    offset->fX += srcBounds.fLeft;
    offset->fY += srcBounds.fTop;
    return true;
}

/**
 *  GPU implementation: blurs the input texture with SkGpuBlurUtils and wraps
 *  the resulting texture in 'result'. 'offset' is advanced by the top-left of
 *  the cropped bounds on success. In builds without SK_SUPPORT_GPU this
 *  asserts (debug) and returns false.
 */
bool SkBlurImageFilter::filterImageGPU(Proxy* proxy, const SkBitmap& src, const SkMatrix& ctm,
                                       SkBitmap* result, SkIPoint* offset) {
#if SK_SUPPORT_GPU
    SkBitmap input;
    if (!SkImageFilterUtils::GetInputResultGPU(getInput(0), proxy, src, ctm, &input, offset)) {
        return false;
    }
    GrTexture* source = input.getTexture();
    // 'source' is dereferenced below; fail cleanly if the input bitmap turned
    // out not to carry a texture.
    if (!source) {
        return false;
    }
    SkIRect rect;
    src.getBounds(&rect);
    if (!this->applyCropRect(&rect, ctm)) {
        return false;
    }
    SkAutoTUnref<GrTexture> tex(SkGpuBlurUtils::GaussianBlur(source->getContext(),
                                                             source,
                                                             false,
                                                             SkRect::Make(rect),
                                                             true,
                                                             fSigma.width(),
                                                             fSigma.height()));
    // Presumably GaussianBlur yields NULL when it cannot produce a texture;
    // do not wrap a NULL texture or touch 'offset' in that case.
    if (!tex.get()) {
        return false;
    }
    offset->fX += rect.fLeft;
    offset->fY += rect.fTop;
    return SkImageFilterUtils::WrapTexture(tex, rect.width(), rect.height(), result);
#else
    SkDEBUGFAIL("Should not call in GPU-less build");
    return false;
#endif
}