SkBlurMask.cpp revision 9c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254
1ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com
2ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com/*
3ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * Copyright 2006 The Android Open Source Project
4ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com *
5ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * Use of this source code is governed by a BSD-style license that can be
6ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * found in the LICENSE file.
7ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com */
8ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com
98a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkBlurMask.h"
11889bd8bd7f604acae0a6303365bc82c06da1e6f3tomhudson@google.com#include "SkMath.h"
128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkTemplates.h"
1301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#include "SkEndian.h"
1401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
// Scale factor for the blur radius to match the behavior of all the existing blur
// code (both on the CPU and the GPU).  This magic constant is 1/sqrt(3).
177c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
188ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// TODO: get rid of this fudge factor and move any required fudging up into
197c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// the calling library
207c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
217c7292c6071898d73dc935c3b66b9816183806f0humper@google.com#define kBlurRadiusFudgeFactor SkFloatToScalar( .57735f )
227c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define UNROLL_SEPARABLE_LOOPS
249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
25908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org/**
26908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * This function performs a box blur in X, of the given radius.  If the
27884e60be30e20f38b3466a4697081187d2f1f814skia.committer@gmail.com * "transpose" parameter is true, it will transpose the pixels on write,
28908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * such that X and Y are swapped. Reads are always performed from contiguous
29908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * memory in X, for speed. The destination buffer (dst) must be at least
309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * (width + leftRadius + rightRadius) * height bytes in size.
31908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org */
32908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.orgstatic int boxBlur(const uint8_t* src, int src_y_stride, uint8_t* dst,
33c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org                   int leftRadius, int rightRadius, int width, int height,
34c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org                   bool transpose)
3571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{
369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int diameter = leftRadius + rightRadius;
379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int kernelSize = diameter + 1;
389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int border = SkMin32(width, diameter);
3971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    uint32_t scale = (1 << 24) / kernelSize;
40c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org    int new_width = width + SkMax32(leftRadius, rightRadius) * 2;
41908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org    int dst_x_stride = transpose ? height : 1;
42908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org    int dst_y_stride = transpose ? 1 : new_width;
4371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    for (int y = 0; y < height; ++y) {
4471f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        int sum = 0;
45908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org        uint8_t* dptr = dst + y * dst_y_stride;
46908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org        const uint8_t* right = src + y * src_y_stride;
47908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org        const uint8_t* left = right;
48336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org        for (int x = 0; x < rightRadius - leftRadius; x++) {
49336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org            *dptr = 0;
50336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org            dptr += dst_x_stride;
51c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org        }
529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define LEFT_BORDER_ITER \
539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            sum += *right++; \
549b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            *dptr = (sum * scale) >> 24; \
55908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            dptr += dst_x_stride;
569b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        int x = 0;
589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border - 16; x += 16) {
609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
699b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
719b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
729b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
7671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        }
779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border; ++x) {
799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef LEFT_BORDER_ITER
829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define TRIVIAL_ITER \
839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            *dptr = (sum * scale) >> 24; \
84908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            dptr += dst_x_stride;
859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = width;
869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < diameter - 16; x += 16) {
889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
1059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
1069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < diameter; ++x) {
1079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
10871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        }
1099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef TRIVIAL_ITER
1109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define CENTER_ITER \
1119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            sum += *right++; \
1129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            *dptr = (sum * scale) >> 24; \
1139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            sum -= *left++; \
114908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            dptr += dst_x_stride;
1159b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
1169b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = diameter;
1179b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
1189b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < width - 16; x += 16) {
1199b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1209b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1219b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1259b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1269b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1299b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1319b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1329b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1339b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1349b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1359b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
1369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
1379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < width; ++x) {
1389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
13971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        }
1409b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef CENTER_ITER
1419b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define RIGHT_BORDER_ITER \
1429b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            *dptr = (sum * scale) >> 24; \
1439b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            sum -= *left++; \
144908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            dptr += dst_x_stride;
1459b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
1469b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = 0;
1479b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
1489b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border - 16; x += 16) {
1499b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1509b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1519b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1549b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1559b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1569b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
1669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
1679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border; ++x) {
1689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
16971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        }
1709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef RIGHT_BORDER_ITER
171336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org        for (int x = 0; x < leftRadius - rightRadius; x++) {
172336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org            *dptr = 0;
173336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org            dptr += dst_x_stride;
174c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org        }
17571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        SkASSERT(sum == 0);
17671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    }
177908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org    return new_width;
17871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org}
17971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org
1809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org/**
1819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * This variant of the box blur handles blurring of non-integer radii.  It
1829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * keeps two running sums: an outer sum for the rounded-up kernel radius, and
1839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * an inner sum for the rounded-down kernel radius.  For each pixel, it linearly
1849b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * interpolates between them.  In float this would be:
1859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *  outer_weight * outer_sum / kernelSize +
1869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *  (1.0 - outer_weight) * innerSum / (kernelSize - 2)
1879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org */
1889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.orgstatic int boxBlurInterp(const uint8_t* src, int src_y_stride, uint8_t* dst,
1899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org                         int radius, int width, int height,
1909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org                         bool transpose, uint8_t outer_weight)
1919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org{
1929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int diameter = radius * 2;
1939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int kernelSize = diameter + 1;
1949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int border = SkMin32(width, diameter);
1959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int inner_weight = 255 - outer_weight;
1969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    outer_weight += outer_weight >> 7;
1979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    inner_weight += inner_weight >> 7;
1989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    uint32_t outer_scale = (outer_weight << 16) / kernelSize;
1999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    uint32_t inner_scale = (inner_weight << 16) / (kernelSize - 2);
2009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int new_width = width + diameter;
2019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int dst_x_stride = transpose ? height : 1;
2029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int dst_y_stride = transpose ? 1 : new_width;
2039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    for (int y = 0; y < height; ++y) {
2049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        int outer_sum = 0, inner_sum = 0;
2059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        uint8_t* dptr = dst + y * dst_y_stride;
2069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        const uint8_t* right = src + y * src_y_stride;
2079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        const uint8_t* left = right;
2089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        int x = 0;
2099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
2109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define LEFT_BORDER_ITER \
2119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            inner_sum = outer_sum; \
2129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            outer_sum += *right++; \
2139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            *dptr = (outer_sum * outer_scale + inner_sum * inner_scale) >> 24; \
2149b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            dptr += dst_x_stride;
2159b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
2169b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
2179b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (;x < border - 16; x += 16) {
2189b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2199b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2209b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2219b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2259b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2269b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2299b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2319b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2329b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2339b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2349b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
2359b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
2369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
2379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (;x < border; x++) {
2389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
2399b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
2409b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef LEFT_BORDER_ITER
2419b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (int x = width; x < diameter; ++x) {
2429b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            *dptr = (outer_sum * outer_scale + inner_sum * inner_scale) >> 24;
2439b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            dptr += dst_x_stride;
2449b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
2459b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = diameter;
2469b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
2479b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define CENTER_ITER \
2489b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            inner_sum = outer_sum - *left; \
2499b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            outer_sum += *right++; \
2509b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            *dptr = (outer_sum * outer_scale + inner_sum * inner_scale) >> 24; \
2519b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            dptr += dst_x_stride; \
2529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            outer_sum -= *left++;
2539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
2549b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
2559b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < width - 16; x += 16) {
2569b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2699b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2719b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2729b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
2739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
2749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < width; ++x) {
2759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
2769b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
2779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef CENTER_ITER
2789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
2799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        #define RIGHT_BORDER_ITER \
2809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            inner_sum = outer_sum - *left++; \
2819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            *dptr = (outer_sum * outer_scale + inner_sum * inner_scale) >> 24; \
2829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            dptr += dst_x_stride; \
2839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            outer_sum = inner_sum;
2849b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
2859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = 0;
2869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
2879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border - 16; x += 16) {
2889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
3059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
3069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border; x++) {
3079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
3099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef RIGHT_BORDER_ITER
3109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        SkASSERT(outer_sum == 0 && inner_sum == 0);
3119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    }
3129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    return new_width;
3139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org}
3149b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
315c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.orgstatic void get_adjusted_radii(SkScalar passRadius, int *loRadius, int *hiRadius)
316c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org{
317c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org    *loRadius = *hiRadius = SkScalarCeil(passRadius);
318c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org    if (SkIntToScalar(*hiRadius) - passRadius > SkFloatToScalar(0.5f)) {
319c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org        *loRadius = *hiRadius - 1;
320c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org    }
321c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org}
322c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org
// Unrolling the integer blur kernel seems to give us a ~15% speedup on Windows,
// breakeven on Mac, and ~15% slowdown on Linux.
// Reading a word at a time when building the sum buffer seems to give
// us no appreciable speedup on Windows or Mac, and 2% slowdown on Linux.
327054ff1efa4f9187ce7fd20aaf3aed7cecf14e12btomhudson@google.com#if defined(SK_BUILD_FOR_WIN32)
32801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#define UNROLL_KERNEL_LOOP 1
32901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif
3308a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
3314560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com/** The sum buffer is an array of u32 to hold the accumulated sum of all of the
3324560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    src values at their position, plus all values above and to the left.
3334560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    When we sample into this buffer, we need an initial row and column of 0s,
3344560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    so we have an index correspondence as follows:
335fbfcd5602128ec010c82cb733c9cdc0a3254f9f3rmistry@google.com
3364560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    src[i, j] == sum[i+1, j+1]
3374560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    sum[0, j] == sum[i, 0] == 0
338fbfcd5602128ec010c82cb733c9cdc0a3254f9f3rmistry@google.com
3394560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    We assume that the sum buffer's stride == its width
3404560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com */
34103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.comstatic void build_sum_buffer(uint32_t sum[], int srcW, int srcH,
34203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                             const uint8_t src[], int srcRB) {
3434560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int sumW = srcW + 1;
3444560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com
3454560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    SkASSERT(srcRB >= srcW);
3468a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    // mod srcRB so we can apply it after each row
3474560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    srcRB -= srcW;
3488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
3498a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int x, y;
3508a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
3514560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    // zero out the top row and column
3524560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    memset(sum, 0, sumW * sizeof(sum[0]));
3534560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    sum += sumW;
3544560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com
3558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    // special case first row
3568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    uint32_t X = 0;
3574560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    *sum++ = 0; // initialze the first column to 0
35803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com    for (x = srcW - 1; x >= 0; --x) {
3598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        X = *src++ + X;
3604560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        *sum++ = X;
3618a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
3628a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    src += srcRB;
3638a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
3648a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    // now do the rest of the rows
36503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com    for (y = srcH - 1; y > 0; --y) {
3668a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        uint32_t L = 0;
3678a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        uint32_t C = 0;
3684560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        *sum++ = 0; // initialze the first column to 0
36901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
37001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (x = srcW - 1; !SkIsAlign4((intptr_t) src) && x >= 0; x--) {
37101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t T = sum[-sumW];
37201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
37301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
37401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
37501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
37601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        }
37701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
37801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x >= 4; x-=4) {
37901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t T = sum[-sumW];
38001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
38101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
38201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
38301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
38401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            T = sum[-sumW];
38501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
38601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
38701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
38801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
38901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            T = sum[-sumW];
39001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
39101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
39201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
39301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
39401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            T = sum[-sumW];
39501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
39601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
39701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
39801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
39901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        }
40001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
40101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x >= 0; --x) {
4024560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com            uint32_t T = sum[-sumW];
4038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            X = *src++ + L + T - C;
4044560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com            *sum++ = X;
4058a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            L = X;
4068a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            C = T;
4078a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
4088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        src += srcRB;
4098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
4108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
4118a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
41203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/**
4138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * This is the path for apply_kernel() to be taken when the kernel
4148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * is wider than the source image.
4158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com */
4168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.comstatic void kernel_clamped(uint8_t dst[], int rx, int ry, const uint32_t sum[],
4178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           int sw, int sh) {
4188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    SkASSERT(2*rx > sw);
4198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4208caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    uint32_t scale = (1 << 24) / ((2*rx + 1)*(2*ry + 1));
4218caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4228caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int sumStride = sw + 1;
4238caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4248caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int dw = sw + 2*rx;
4258caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int dh = sh + 2*ry;
4268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int prev_y = -2*ry;
4288caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int next_y = 1;
4298caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4308caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    for (int y = 0; y < dh; y++) {
4318caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int py = SkClampPos(prev_y) * sumStride;
4328caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int ny = SkFastMin32(next_y, sh) * sumStride;
4338caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int prev_x = -2*rx;
4358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int next_x = 1;
4368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4378caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (int x = 0; x < dw; x++) {
4388caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = SkClampPos(prev_x);
4398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = SkFastMin32(next_x, sw);
4408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny];
4428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
4438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
4458caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
4468caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
4478caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4488caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        prev_y += 1;
4498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        next_y += 1;
4508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    }
4518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com}
4528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com/**
45303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  sw and sh are the width and height of the src. Since the sum buffer
45403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  matches that, but has an extra row and col at the beginning (with zeros),
45503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  we can just use sw and sh as our "max" values for pinning coordinates
45603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  when sampling into sum[][]
4578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *
4588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *  The inner loop is conceptually simple; we break it into several sections
4598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *  to improve performance. Here's the original version:
4608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (int x = 0; x < dw; x++) {
4618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = SkClampPos(prev_x);
4628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = SkFastMin32(next_x, sw);
4638caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny];
4658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
4668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
4688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
4698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
47001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  The sections are:
47101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     left-hand section, where prev_x is clamped to 0
47201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     center section, where neither prev_x nor next_x is clamped
47301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     right-hand section, where next_x is clamped to sw
47401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  On some operating systems, the center section is unrolled for additional
47501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  speedup.
4768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com*/
4774560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.comstatic void apply_kernel(uint8_t dst[], int rx, int ry, const uint32_t sum[],
4784560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com                         int sw, int sh) {
4798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    if (2*rx > sw) {
4808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        kernel_clamped(dst, rx, ry, sum, sw, sh);
4818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        return;
4828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    }
4838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4848a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    uint32_t scale = (1 << 24) / ((2*rx + 1)*(2*ry + 1));
4858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
4864560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int sumStride = sw + 1;
4878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
4888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int dw = sw + 2*rx;
4898a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int dh = sh + 2*ry;
4908a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
4914560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int prev_y = -2*ry;
4924560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int next_y = 1;
4938a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
4948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    SkASSERT(2*rx <= dw - 2*rx);
4958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
4964560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    for (int y = 0; y < dh; y++) {
4974560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int py = SkClampPos(prev_y) * sumStride;
4984560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int ny = SkFastMin32(next_y, sh) * sumStride;
4998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
5004560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int prev_x = -2*rx;
5014560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int next_x = 1;
5028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int x = 0;
5038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (; x < 2*rx; x++) {
5058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x <= 0);
5068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x <= sw);
5078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = 0;
5098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = next_x;
5108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny];
5128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
5138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
5158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
5168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
5178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
51801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i0 = prev_x + py;
51901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i1 = next_x + ny;
52001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i2 = next_x + py;
52101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i3 = prev_x + ny;
52201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
52301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#if UNROLL_KERNEL_LOOP
52401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x < dw - 2*rx - 4; x += 4) {
5258caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x >= 0);
5268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x <= sw);
5278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
52801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
52901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
53001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
53101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
53201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
53301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
53401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
53501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
5368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
53701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            prev_x += 4;
53801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            next_x += 4;
53901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        }
54001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif
54101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
54201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x < dw - 2*rx; x++) {
54301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            SkASSERT(prev_x >= 0);
54401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            SkASSERT(next_x <= sw);
54501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
54601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
5478caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
5488caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
5508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
5518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
5528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5538caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (; x < dw; x++) {
5548caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x >= 0);
5558caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x > sw);
5568caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = prev_x;
5588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = sw;
5598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny];
5618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
5628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5638caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
5648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
5658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
5668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        prev_y += 1;
5688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        next_y += 1;
5698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    }
5708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com}
5718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com/**
5738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * This is the path for apply_kernel_interp() to be taken when the kernel
5748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * is wider than the source image.
5758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com */
5768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.comstatic void kernel_interp_clamped(uint8_t dst[], int rx, int ry,
5778caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                const uint32_t sum[], int sw, int sh, U8CPU outer_weight) {
5788caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    SkASSERT(2*rx > sw);
5798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int inner_weight = 255 - outer_weight;
5818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    // round these guys up if they're bigger than 127
5838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    outer_weight += outer_weight >> 7;
5848caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    inner_weight += inner_weight >> 7;
5858caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5868caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    uint32_t outer_scale = (outer_weight << 16) / ((2*rx + 1)*(2*ry + 1));
5878caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    uint32_t inner_scale = (inner_weight << 16) / ((2*rx - 1)*(2*ry - 1));
5888caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5898caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int sumStride = sw + 1;
5908caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5918caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int dw = sw + 2*rx;
5928caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int dh = sh + 2*ry;
5938caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int prev_y = -2*ry;
5958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int next_y = 1;
5968caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5978caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    for (int y = 0; y < dh; y++) {
5988caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int py = SkClampPos(prev_y) * sumStride;
5998caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int ny = SkFastMin32(next_y, sh) * sumStride;
6008caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6018caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int ipy = SkClampPos(prev_y + 1) * sumStride;
6028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int iny = SkClampMax(next_y - 1, sh) * sumStride;
6038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int prev_x = -2*rx;
6058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int next_x = 1;
6068a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6074560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        for (int x = 0; x < dw; x++) {
6088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            int px = SkClampPos(prev_x);
6098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            int nx = SkFastMin32(next_x, sw);
6108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int ipx = SkClampPos(prev_x + 1);
6128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int inx = SkClampMax(next_x - 1, sw);
6138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t outer_sum = sum[px+py] + sum[nx+ny]
6158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[nx+py] - sum[px+ny];
6168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny]
6178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[inx+ipy] - sum[ipx+iny];
6188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
6198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
6208a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6218a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            prev_x += 1;
6228a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            next_x += 1;
6238a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
6248a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        prev_y += 1;
6258a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        next_y += 1;
6268a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
6278a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
6288a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
62903016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/**
63003016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  sw and sh are the width and height of the src. Since the sum buffer
63103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  matches that, but has an extra row and col at the beginning (with zeros),
63203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  we can just use sw and sh as our "max" values for pinning coordinates
63303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  when sampling into sum[][]
6348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *
6358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *  The inner loop is conceptually simple; we break it into several variants
6368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *  to improve performance. Here's the original version:
6378caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (int x = 0; x < dw; x++) {
6388caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = SkClampPos(prev_x);
6398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = SkFastMin32(next_x, sw);
6408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int ipx = SkClampPos(prev_x + 1);
6428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int inx = SkClampMax(next_x - 1, sw);
6438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t outer_sum = sum[px+py] + sum[nx+ny]
6458caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[nx+py] - sum[px+ny];
6468caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny]
6478caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[inx+ipy] - sum[ipx+iny];
6488caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
6498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
6508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
6528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
6538caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
65401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  The sections are:
65501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     left-hand section, where prev_x is clamped to 0
65601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     center section, where neither prev_x nor next_x is clamped
65701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     right-hand section, where next_x is clamped to sw
65801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  On some operating systems, the center section is unrolled for additional
65901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  speedup.
6608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com*/
6614560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.comstatic void apply_kernel_interp(uint8_t dst[], int rx, int ry,
6624560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com                const uint32_t sum[], int sw, int sh, U8CPU outer_weight) {
6638a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkASSERT(rx > 0 && ry > 0);
6648a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkASSERT(outer_weight <= 255);
6658a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    if (2*rx > sw) {
6678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        kernel_interp_clamped(dst, rx, ry, sum, sw, sh, outer_weight);
6688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        return;
6698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    }
6708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6718a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int inner_weight = 255 - outer_weight;
6728a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6738a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    // round these guys up if they're bigger than 127
6748a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    outer_weight += outer_weight >> 7;
6758a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    inner_weight += inner_weight >> 7;
6768a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6778a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    uint32_t outer_scale = (outer_weight << 16) / ((2*rx + 1)*(2*ry + 1));
6788a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    uint32_t inner_scale = (inner_weight << 16) / ((2*rx - 1)*(2*ry - 1));
6798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6804560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int sumStride = sw + 1;
6818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6828a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int dw = sw + 2*rx;
6838a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int dh = sh + 2*ry;
6848a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6854560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int prev_y = -2*ry;
6864560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int next_y = 1;
6878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6888caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    SkASSERT(2*rx <= dw - 2*rx);
6898caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6904560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    for (int y = 0; y < dh; y++) {
6914560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int py = SkClampPos(prev_y) * sumStride;
6924560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int ny = SkFastMin32(next_y, sh) * sumStride;
6938a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6944560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int ipy = SkClampPos(prev_y + 1) * sumStride;
6954560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int iny = SkClampMax(next_y - 1, sh) * sumStride;
6968a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6974560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int prev_x = -2*rx;
6984560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int next_x = 1;
6998caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int x = 0;
7008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7018caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (; x < 2*rx; x++) {
7028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x < 0);
7038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x <= sw);
7048a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = 0;
7068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = next_x;
7078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int ipx = 0;
7098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int inx = next_x - 1;
7108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t outer_sum = sum[px+py] + sum[nx+ny]
7128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[nx+py] - sum[px+ny];
7138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny]
7148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[inx+ipy] - sum[ipx+iny];
7158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
7168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
7178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
7198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
7208caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
7218caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
72201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i0 = prev_x + py;
72301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i1 = next_x + ny;
72401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i2 = next_x + py;
72501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i3 = prev_x + ny;
72601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i4 = prev_x + 1 + ipy;
72701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i5 = next_x - 1 + iny;
72801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i6 = next_x - 1 + ipy;
72901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i7 = prev_x + 1 + iny;
73001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
73101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#if UNROLL_KERNEL_LOOP
73201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x < dw - 2*rx - 4; x += 4) {
7338caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x >= 0);
7348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x <= sw);
7358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
73601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
73701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
73801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
73901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
74001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
74101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
74201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
74301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
74401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
74501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
74601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
74701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
74801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
74901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
75001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
75101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
7528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
75301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            prev_x += 4;
75401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            next_x += 4;
75501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        }
75601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif
7578a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
75801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x < dw - 2*rx; x++) {
75901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            SkASSERT(prev_x >= 0);
76001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            SkASSERT(next_x <= sw);
76101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
76201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
76301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
7648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
7658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
7668a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7678a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            prev_x += 1;
7688a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            next_x += 1;
7698a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
7708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (; x < dw; x++) {
7728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x >= 0);
7738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x > sw);
7748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = prev_x;
7768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = sw;
7778caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7788caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int ipx = prev_x + 1;
7798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int inx = sw;
7808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t outer_sum = sum[px+py] + sum[nx+ny]
7828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[nx+py] - sum[px+ny];
7838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny]
7848caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[inx+ipy] - sum[ipx+iny];
7858caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
7868caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
7878caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7888caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
7898caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
7908caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
7918caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7928a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        prev_y += 1;
7938a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        next_y += 1;
7948a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
7958a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
7968a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7978a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkColorPriv.h"
7988a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7990e3c664250f561ec9f7107b92136517a72d03afdreed@android.comstatic void merge_src_with_blur(uint8_t dst[], int dstRB,
8000e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                                const uint8_t src[], int srcRB,
8010e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                                const uint8_t blur[], int blurRB,
8020e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                                int sw, int sh) {
8030e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    dstRB -= sw;
8040e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    srcRB -= sw;
8050e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    blurRB -= sw;
8060e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    while (--sh >= 0) {
8070e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        for (int x = sw - 1; x >= 0; --x) {
8088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            *dst = SkToU8(SkAlphaMul(*blur, SkAlpha255To256(*src)));
8098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            dst += 1;
8108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            src += 1;
8118a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            blur += 1;
8128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
8130e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        dst += dstRB;
8140e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        src += srcRB;
8150e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        blur += blurRB;
8168a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
8178a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
8188a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8198a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.comstatic void clamp_with_orig(uint8_t dst[], int dstRowBytes,
8200e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                            const uint8_t src[], int srcRowBytes,
8210e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                            int sw, int sh,
8224560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com                            SkBlurMask::Style style) {
8238a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int x;
8240e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    while (--sh >= 0) {
8258a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        switch (style) {
8268a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        case SkBlurMask::kSolid_Style:
8270e3c664250f561ec9f7107b92136517a72d03afdreed@android.com            for (x = sw - 1; x >= 0; --x) {
8280e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                int s = *src;
8290e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                int d = *dst;
8300e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                *dst = SkToU8(s + d - SkMulDiv255Round(s, d));
8318a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                dst += 1;
8328a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                src += 1;
8338a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            }
8348a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            break;
8358a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        case SkBlurMask::kOuter_Style:
8360e3c664250f561ec9f7107b92136517a72d03afdreed@android.com            for (x = sw - 1; x >= 0; --x) {
8370e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                if (*src) {
8388a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                    *dst = SkToU8(SkAlphaMul(*dst, SkAlpha255To256(255 - *src)));
8390e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                }
8408a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                dst += 1;
8418a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                src += 1;
8428a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            }
8438a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            break;
8448a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        default:
8450c00f21fee3f5cfa3aa7e5d46ff94cb8cf340451tomhudson@google.com            SkDEBUGFAIL("Unexpected blur style here");
8468a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            break;
8478a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
8488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        dst += dstRowBytes - sw;
8490e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        src += srcRowBytes - sw;
8508a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
8518a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
8528a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
85303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com///////////////////////////////////////////////////////////////////////////////
8548a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com// we use a local funciton to wrap the class static method to work around
8568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com// a bug in gcc98
8578a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.comvoid SkMask_FreeImage(uint8_t* image);
85803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.comvoid SkMask_FreeImage(uint8_t* image) {
8598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkMask::FreeImage(image);
8608a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
8618a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8628a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.combool SkBlurMask::Blur(SkMask* dst, const SkMask& src,
8635af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com                      SkScalar radius, Style style, Quality quality,
86471f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                      SkIPoint* margin, bool separable)
8655af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com{
86603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com    if (src.fFormat != SkMask::kA8_Format) {
8678a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        return false;
86803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com    }
8698a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8704868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    // Force high quality off for small radii (performance)
87191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org    if (radius < SkIntToScalar(3)) {
87291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org        quality = kLow_Quality;
87391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org    }
8744868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org
8754868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    // highQuality: use three box blur passes as a cheap way to approximate a Gaussian blur
87691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org    int passCount = (kHigh_Quality == quality) ? 3 : 1;
8777c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    SkScalar passRadius = (kHigh_Quality == quality) ? SkScalarMul( radius, kBlurRadiusFudgeFactor): radius;
8784868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org
8794868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    int rx = SkScalarCeil(passRadius);
8804868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    int outer_weight = 255 - SkScalarRound((SkIntToScalar(rx) - passRadius) * 255);
8818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8828a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkASSERT(rx >= 0);
8838a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkASSERT((unsigned)outer_weight <= 255);
8840e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    if (rx <= 0) {
8858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        return false;
8860e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    }
8878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int ry = rx;    // only do square blur for now
8898a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8904868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    int padx = passCount * rx;
8914868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    int pady = passCount * ry;
8925af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com    if (margin) {
8935af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com        margin->set(padx, pady);
8945af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com    }
8954868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    dst->fBounds.set(src.fBounds.fLeft - padx, src.fBounds.fTop - pady,
8964868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org        src.fBounds.fRight + padx, src.fBounds.fBottom + pady);
89749f0ff25a046d6001dc2d095b6fa3c30f0f46b6areed@android.com    dst->fRowBytes = dst->fBounds.width();
8988a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    dst->fFormat = SkMask::kA8_Format;
8998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    dst->fImage = NULL;
9008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9010e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    if (src.fImage) {
902543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com        size_t dstSize = dst->computeImageSize();
903543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com        if (0 == dstSize) {
904543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            return false;   // too big to allocate, abort
905543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com        }
906543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com
9078a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        int             sw = src.fBounds.width();
9088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        int             sh = src.fBounds.height();
9098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        const uint8_t*  sp = src.fImage;
910543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com        uint8_t*        dp = SkMask::AllocImage(dstSize);
9118a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        SkAutoTCallVProc<uint8_t, SkMask_FreeImage> autoCall(dp);
9138a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9148a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        // build the blurry destination
91571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        if (separable) {
91671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org            SkAutoTMalloc<uint8_t>  tmpBuffer(dstSize);
91771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org            uint8_t*                tp = tmpBuffer.get();
91871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org            int w = sw, h = sh;
91971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org
92091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org            if (outer_weight == 255) {
921c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org                int loRadius, hiRadius;
922c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org                get_adjusted_radii(passRadius, &loRadius, &hiRadius);
92391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                if (kHigh_Quality == quality) {
92491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    // Do three X blurs, with a transpose on the final one.
92591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlur(sp, src.fRowBytes, tp, loRadius, hiRadius, w, h, false);
92691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlur(tp, w,             dp, hiRadius, loRadius, w, h, false);
92791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlur(dp, w,             tp, hiRadius, hiRadius, w, h, true);
92891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    // Do three Y blurs, with a transpose on the final one.
92991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlur(tp, h,             dp, loRadius, hiRadius, h, w, false);
93091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlur(dp, h,             tp, hiRadius, loRadius, h, w, false);
93191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlur(tp, h,             dp, hiRadius, hiRadius, h, w, true);
93291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                } else {
93391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlur(sp, src.fRowBytes, tp, rx, rx, w, h, true);
93491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlur(tp, h,             dp, ry, ry, h, w, true);
93591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                }
936908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            } else {
93791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                if (kHigh_Quality == quality) {
93891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    // Do three X blurs, with a transpose on the final one.
93991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlurInterp(sp, src.fRowBytes, tp, rx, w, h, false, outer_weight);
94091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlurInterp(tp, w,             dp, rx, w, h, false, outer_weight);
94191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlurInterp(dp, w,             tp, rx, w, h, true, outer_weight);
94291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    // Do three Y blurs, with a transpose on the final one.
94391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlurInterp(tp, h,             dp, ry, h, w, false, outer_weight);
94491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlurInterp(dp, h,             tp, ry, h, w, false, outer_weight);
94591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlurInterp(tp, h,             dp, ry, h, w, true, outer_weight);
94691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                } else {
94791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlurInterp(sp, src.fRowBytes, tp, rx, w, h, true, outer_weight);
94891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlurInterp(tp, h,             dp, ry, h, w, true, outer_weight);
94991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                }
95071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org            }
95171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        } else {
95203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            const size_t storageW = sw + 2 * (passCount - 1) * rx + 1;
95303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            const size_t storageH = sh + 2 * (passCount - 1) * ry + 1;
95403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            SkAutoTMalloc<uint32_t> storage(storageW * storageH);
9558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            uint32_t*               sumBuffer = storage.get();
9568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9574868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org            //pass1: sp is source, dp is destination
9588a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            build_sum_buffer(sumBuffer, sw, sh, sp, src.fRowBytes);
95903016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            if (outer_weight == 255) {
9608a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                apply_kernel(dp, rx, ry, sumBuffer, sw, sh);
96103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            } else {
9628a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                apply_kernel_interp(dp, rx, ry, sumBuffer, sw, sh, outer_weight);
96303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            }
9644868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org
96591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org            if (kHigh_Quality == quality) {
9664868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                //pass2: dp is source, tmpBuffer is destination
9674868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                int tmp_sw = sw + 2 * rx;
9684868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                int tmp_sh = sh + 2 * ry;
9694868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                SkAutoTMalloc<uint8_t>  tmpBuffer(dstSize);
9704868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                build_sum_buffer(sumBuffer, tmp_sw, tmp_sh, dp, tmp_sw);
9714868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                if (outer_weight == 255)
9724868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                    apply_kernel(tmpBuffer.get(), rx, ry, sumBuffer, tmp_sw, tmp_sh);
9734868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                else
97403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                    apply_kernel_interp(tmpBuffer.get(), rx, ry, sumBuffer,
97503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                                        tmp_sw, tmp_sh, outer_weight);
9764868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org
9774868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                //pass3: tmpBuffer is source, dp is destination
9784868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                tmp_sw += 2 * rx;
9794868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                tmp_sh += 2 * ry;
9804868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                build_sum_buffer(sumBuffer, tmp_sw, tmp_sh, tmpBuffer.get(), tmp_sw);
9814868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                if (outer_weight == 255)
9824868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                    apply_kernel(dp, rx, ry, sumBuffer, tmp_sw, tmp_sh);
9834868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                else
98403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                    apply_kernel_interp(dp, rx, ry, sumBuffer, tmp_sw, tmp_sh,
98503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                                        outer_weight);
9864868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org            }
9878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
9888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9898a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        dst->fImage = dp;
9908a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        // if need be, alloc the "real" dst (same size as src) and copy/merge
9918a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        // the blur into it (applying the src)
9920e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        if (style == kInner_Style) {
9930e3c664250f561ec9f7107b92136517a72d03afdreed@android.com            // now we allocate the "real" dst, mirror the size of src
994543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            size_t srcSize = src.computeImageSize();
995543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            if (0 == srcSize) {
996543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com                return false;   // too big to allocate, abort
997543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            }
998543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            dst->fImage = SkMask::AllocImage(srcSize);
9990e3c664250f561ec9f7107b92136517a72d03afdreed@android.com            merge_src_with_blur(dst->fImage, src.fRowBytes,
10000e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                                sp, src.fRowBytes,
100103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                                dp + passCount * (rx + ry * dst->fRowBytes),
100203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                                dst->fRowBytes, sw, sh);
10038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            SkMask::FreeImage(dp);
10040e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        } else if (style != kNormal_Style) {
100503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            clamp_with_orig(dp + passCount * (rx + ry * dst->fRowBytes),
100603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                            dst->fRowBytes, sp, src.fRowBytes, sw, sh, style);
10078a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
10088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        (void)autoCall.detach();
10098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
10108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
10110e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    if (style == kInner_Style) {
10128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        dst->fBounds = src.fBounds; // restore trimmed bounds
10130e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        dst->fRowBytes = src.fRowBytes;
10148a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
10158a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
10168a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    return true;
10178a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
10188a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
101971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.orgbool SkBlurMask::BlurSeparable(SkMask* dst, const SkMask& src,
102071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                               SkScalar radius, Style style, Quality quality,
102171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                               SkIPoint* margin)
102271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{
102371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    return SkBlurMask::Blur(dst, src, radius, style, quality, margin, true);
102471f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org}
102571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org
102671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.orgbool SkBlurMask::Blur(SkMask* dst, const SkMask& src,
102771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                     SkScalar radius, Style style, Quality quality,
102871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                     SkIPoint* margin)
102971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{
103071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    return SkBlurMask::Blur(dst, src, radius, style, quality, margin, false);
103171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org}
10327c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
/* Convolving a box with itself three times results in a piecewise
   quadratic function:

   0                              x <= -1.5
   9/8 + 3/2 x + 1/2 x^2   -1.5 < x <= -.5
   3/4 - x^2                -.5 < x <= .5
   9/8 - 3/2 x + 1/2 x^2     .5 < x <= 1.5
   0                        1.5 < x

   To get the profile curve of the blurred step function at the rectangle
   edge, we evaluate the indefinite integral, which is piecewise cubic:

   0                                        x <= -1.5
   9/16 + 9/8 x + 3/4 x^2 + 1/6 x^3   -1.5 < x <= -.5
   1/2 + 3/4 x - 1/3 x^3               -.5 < x <= .5
   7/16 + 9/8 x - 3/4 x^2 + 1/6 x^3     .5 < x <= 1.5
   1                                   1.5 < x

   Note that gaussian_integral() below returns one minus this integral.
*/

10517c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
/*
    Piecewise-cubic falloff used to build the blur profile.

    Returns exactly 1 for x < -1.5 and exactly 0 for x > 1.5.  In between
    it evaluates one of three cubic segments (split at x = -0.5 and
    x = 0.5), decreasing from 1 to 0 and passing through 0.5 at x == 0.
*/
static float gaussian_integral( float x ) {
    // Saturate outside the [-1.5, 1.5] support.
    if ( x > 1.5f ) {
        return 0.0f;
    } else if ( x < -1.5f ) {
        return 1.0f;
    }

    const float sq = x*x;
    const float cube = sq*x;

    float result;
    if ( x > 0.5f ) {
        // right-hand tail segment
        result = 0.5625f - ( cube / 6.0f - 3.0f * sq * 0.25f + 1.125f * x);
    } else if ( x > -0.5f ) {
        // central segment
        result = 0.5f - (0.75f * x - cube / 3.0f);
    } else {
        // left-hand tail segment
        result = 0.4375f + (-cube / 6.0f - 3.0f * sq * 0.25f - 1.125f * x);
    }
    return result;
}
10717c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
10728ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com/*
10737c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    compute_profile allocates and fills in an array of floating
10748ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com    point values between 0 and 255 for the profile signature of
10757c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    a blurred half-plane with the given blur radius.  Since we're
10767c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    going to be doing screened multiplications (i.e., 1 - (1-x)(1-y))
10777c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    all the time, we actually fill in the profile pre-inverted
10787c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    (already done 255-x).
10798ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
10807c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    The function returns the size of the array allocated for the
10818ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com    profile.  It's the responsibility of the caller to delete the
10827c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    memory returned in profile_out.
10837c7292c6071898d73dc935c3b66b9816183806f0humper@google.com*/
10847c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
10857c7292c6071898d73dc935c3b66b9816183806f0humper@google.comstatic int compute_profile( SkScalar radius, unsigned int **profile_out ) {
10869c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com    int size = SkScalarFloorToInt(radius * 3 + 1);
10877c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int center = size >> 1;
10887c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
10897c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    unsigned int *profile = new unsigned int [size];
10907c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
10917c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    float invr = 1.0f/radius;
10927c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
10937c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    profile[0] = 255;
10947c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    for (int x = 1 ; x < size ; x++) {
10957c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        float scaled_x = ( center - x ) * invr;
10967c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        float gi = gaussian_integral( scaled_x );
10977c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        profile[x] = 255 - (uint8_t) ( 255.f * gi );
10987c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    }
10997c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11007c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    *profile_out = profile;
11017c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    return size;
11027c7292c6071898d73dc935c3b66b9816183806f0humper@google.com}
11037c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11048ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// TODO MAYBE: Maintain a profile cache to avoid recomputing this for
11057c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// commonly used radii.  Consider baking some of the most common blur radii
11067c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// directly in as static data?
11077c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11087c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// Implementation adapted from Michael Herf's approach:
11097c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// http://stereopsis.com/shadowrect/
11107c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11117c7292c6071898d73dc935c3b66b9816183806f0humper@google.combool SkBlurMask::BlurRect(SkMask *dst, const SkRect &src,
11127c7292c6071898d73dc935c3b66b9816183806f0humper@google.com                          SkScalar provided_radius, Style style, Quality quality,
11137c7292c6071898d73dc935c3b66b9816183806f0humper@google.com                          SkIPoint *margin) {
11147c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int profile_size;
11157c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    unsigned int *profile;
11168ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11178ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11187c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    float radius = SkScalarToFloat( SkScalarMul( provided_radius, kBlurRadiusFudgeFactor ) );
11198ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11207c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    profile_size = compute_profile( radius, &profile );
11218ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11227c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int pad = (int) (radius * 1.5f + 1);
11237c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    if (margin) {
11247c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        margin->set( pad, pad );
11257c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    }
11269c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com    dst->fBounds = SkIRect::MakeWH(SkScalarFloorToInt(src.width()), SkScalarFloorToInt(src.height()));
11277c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fBounds.outset(pad, pad);
11288ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11297c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fRowBytes = dst->fBounds.width();
11307c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fFormat = SkMask::kA8_Format;
11317c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fImage = NULL;
11328ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11337c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    size_t dstSize = dst->computeImageSize();
11347c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    if (0 == dstSize) {
11357c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        return false;   // too big to allocate, abort
11367c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    }
11378ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11389c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com    int             sw = SkScalarFloorToInt(src.width());
11399c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com    int             sh = SkScalarFloorToInt(src.height());
11408ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11417c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    uint8_t*        dp = SkMask::AllocImage(dstSize);
11428ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11437c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fImage = dp;
11448ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11457c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    SkAutoTCallVProc<uint8_t, SkMask_FreeImage> autoCall(dp);
11468ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11477c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int dst_height = dst->fBounds.height();
11487c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int dst_width = dst->fBounds.width();
11498ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11507c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    // nearest odd number less than the profile size represents the center
11517c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    // of the (2x scaled) profile
11527c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int center = ( profile_size & ~1 ) - 1;
11538ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11547c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int w = sw - center;
11557c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int h = sh - center;
11568ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11577c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    uint8_t *outptr = dp;
11588ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11597c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    for (int y = 0 ; y < dst_height ; y++)
11607c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    {
11617c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        // time to fill in a scanline of the blurry rectangle.
11627c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        // to avoid floating point math, everything is multiplied by
11637c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        // 2 where needed.  This keeps things nice and integer-oriented.
11648ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11657c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        int dy = abs((y << 1) - dst_height) - h; // how far are we from the original edge?
11667c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        int oy = dy >> 1;
11677c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        if (oy < 0) oy = 0;
11688ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11697c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        unsigned int profile_y = profile[oy];
11708ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11717c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        for (int x = 0 ; x < (dst_width << 1) ; x += 2) {
11727c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            int dx = abs( x - dst_width ) - w;
11737c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            int ox = dx >> 1;
11747c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            if (ox < 0) ox = 0;
11758ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11767c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            unsigned int maskval = SkMulDiv255Round(profile[ox], profile_y);
11778ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11787c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            *(outptr++) = maskval;
11797c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        }
11807c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    }
11818ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11827c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    return true;
11837c7292c6071898d73dc935c3b66b9816183806f0humper@google.com}
1184