SkBlurMask.cpp revision 76bf70d38fd109a09ee44d074cfd392e1884afff
1ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com
2ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com/*
3ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * Copyright 2006 The Android Open Source Project
4ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com *
5ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * Use of this source code is governed by a BSD-style license that can be
6ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * found in the LICENSE file.
7ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com */
8ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com
98a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkBlurMask.h"
11889bd8bd7f604acae0a6303365bc82c06da1e6f3tomhudson@google.com#include "SkMath.h"
128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkTemplates.h"
1301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#include "SkEndian.h"
1401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
// Scale factor for the blur radius to match the behavior of all the existing blur
// code (both on the CPU and the GPU).  This magic constant is 1/sqrt(3).
177c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
188ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// TODO: get rid of this fudge factor and move any required fudging up into
197c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// the calling library
207c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
217c7292c6071898d73dc935c3b66b9816183806f0humper@google.com#define kBlurRadiusFudgeFactor SkFloatToScalar( .57735f )
227c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define UNROLL_SEPARABLE_LOOPS
249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
25908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org/**
26908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * This function performs a box blur in X, of the given radius.  If the
27884e60be30e20f38b3466a4697081187d2f1f814skia.committer@gmail.com * "transpose" parameter is true, it will transpose the pixels on write,
28908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * such that X and Y are swapped. Reads are always performed from contiguous
29908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * memory in X, for speed. The destination buffer (dst) must be at least
 * (width + 2 * max(leftRadius, rightRadius)) * height bytes in size.
314a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *
324a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * This is what the inner loop looks like before unrolling, and with the two
334a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * cases broken out separately (width < diameter, width >= diameter):
3476bf70d38fd109a09ee44d074cfd392e1884afffskia.committer@gmail.com *
354a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *      if (width < diameter) {
364a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = 0; x < width; ++x) {
374a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              sum += *right++;
3876bf70d38fd109a09ee44d074cfd392e1884afffskia.committer@gmail.com *              *dptr = (sum * scale + half) >> 24;
394a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
404a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
414a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = width; x < diameter; ++x) {
424a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (sum * scale + half) >> 24;
434a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
444a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
454a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = 0; x < width; ++x) {
464a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (sum * scale + half) >> 24;
474a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              sum -= *left++;
484a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
494a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
504a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *      } else {
514a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = 0; x < diameter; ++x) {
524a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              sum += *right++;
534a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (sum * scale + half) >> 24;
544a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
554a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
564a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = diameter; x < width; ++x) {
574a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              sum += *right++;
584a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (sum * scale + half) >> 24;
594a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              sum -= *left++;
604a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
614a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
624a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = 0; x < diameter; ++x) {
634a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (sum * scale + half) >> 24;
644a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              sum -= *left++;
654a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
664a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
674a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *      }
68908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org */
69908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.orgstatic int boxBlur(const uint8_t* src, int src_y_stride, uint8_t* dst,
70c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org                   int leftRadius, int rightRadius, int width, int height,
71c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org                   bool transpose)
7271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{
739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int diameter = leftRadius + rightRadius;
749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int kernelSize = diameter + 1;
759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int border = SkMin32(width, diameter);
7671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    uint32_t scale = (1 << 24) / kernelSize;
77c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org    int new_width = width + SkMax32(leftRadius, rightRadius) * 2;
78908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org    int dst_x_stride = transpose ? height : 1;
79908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org    int dst_y_stride = transpose ? 1 : new_width;
804a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#ifndef SK_DISABLE_BLUR_ROUNDING
814a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org    uint32_t half = 1 << 23;
824a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#else
834a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org    uint32_t half = 0;
844a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#endif
8571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    for (int y = 0; y < height; ++y) {
864a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org        uint32_t sum = 0;
87908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org        uint8_t* dptr = dst + y * dst_y_stride;
88908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org        const uint8_t* right = src + y * src_y_stride;
89908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org        const uint8_t* left = right;
90336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org        for (int x = 0; x < rightRadius - leftRadius; x++) {
91336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org            *dptr = 0;
92336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org            dptr += dst_x_stride;
93c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org        }
949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define LEFT_BORDER_ITER \
959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            sum += *right++; \
964a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org            *dptr = (sum * scale + half) >> 24; \
97908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            dptr += dst_x_stride;
989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        int x = 0;
1009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
1019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border - 16; x += 16) {
1029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1149b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1159b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1169b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1179b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
11871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        }
1199b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
1209b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border; ++x) {
1219b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
1229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
1239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef LEFT_BORDER_ITER
1249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define TRIVIAL_ITER \
1254a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org            *dptr = (sum * scale + half) >> 24; \
126908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            dptr += dst_x_stride;
1279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = width;
1289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
1299b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < diameter - 16; x += 16) {
1309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1319b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1329b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1339b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1349b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1359b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1399b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1409b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1419b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1429b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1439b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1449b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1459b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
1469b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
1479b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
1489b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < diameter; ++x) {
1499b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            TRIVIAL_ITER
15071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        }
1519b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef TRIVIAL_ITER
1529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define CENTER_ITER \
1539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            sum += *right++; \
1544a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org            *dptr = (sum * scale + half) >> 24; \
1559b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            sum -= *left++; \
156908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            dptr += dst_x_stride;
1579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
1589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = diameter;
1599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
1609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < width - 16; x += 16) {
1619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1699b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1719b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1729b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1769b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
1779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
1789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
1799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < width; ++x) {
1809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
18171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        }
1829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef CENTER_ITER
1839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define RIGHT_BORDER_ITER \
1844a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org            *dptr = (sum * scale + half) >> 24; \
1859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            sum -= *left++; \
186908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            dptr += dst_x_stride;
1879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
1889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = 0;
1899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
1909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border - 16; x += 16) {
1919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
1999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
2079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
2089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
2099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border; ++x) {
2109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
21171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        }
2129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef RIGHT_BORDER_ITER
213336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org        for (int x = 0; x < leftRadius - rightRadius; x++) {
214336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org            *dptr = 0;
215336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org            dptr += dst_x_stride;
216c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org        }
21771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        SkASSERT(sum == 0);
21871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    }
219908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org    return new_width;
22071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org}
22171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org
2229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org/**
2239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * This variant of the box blur handles blurring of non-integer radii.  It
2249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * keeps two running sums: an outer sum for the rounded-up kernel radius, and
2259b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * an inner sum for the rounded-down kernel radius.  For each pixel, it linearly
2269b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * interpolates between them.  In float this would be:
2279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *  outer_weight * outer_sum / kernelSize +
 *  (1.0 - outer_weight) * inner_sum / (kernelSize - 2)
22976bf70d38fd109a09ee44d074cfd392e1884afffskia.committer@gmail.com *
2304a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * This is what the inner loop looks like before unrolling, and with the two
2314a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * cases broken out separately (width < diameter, width >= diameter):
23276bf70d38fd109a09ee44d074cfd392e1884afffskia.committer@gmail.com *
2334a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *      if (width < diameter) {
2344a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = 0; x < width; x++) {
2354a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              inner_sum = outer_sum;
2364a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              outer_sum += *right++;
2374a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24;
2384a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
2394a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
2404a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = width; x < diameter; ++x) {
2414a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24;
2424a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
2434a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
2444a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = 0; x < width; x++) {
2454a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              inner_sum = outer_sum - *left++;
2464a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24;
2474a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
2484a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              outer_sum = inner_sum;
2494a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
2504a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *      } else {
2514a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = 0; x < diameter; x++) {
2524a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              inner_sum = outer_sum;
2534a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              outer_sum += *right++;
2544a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24;
2554a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
2564a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
2574a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = diameter; x < width; ++x) {
2584a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              inner_sum = outer_sum - *left;
2594a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              outer_sum += *right++;
2604a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24;
2614a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
2624a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              outer_sum -= *left++;
2634a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
2644a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          for (int x = 0; x < diameter; x++) {
2654a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              inner_sum = outer_sum - *left++;
2664a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24;
2674a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              dptr += dst_x_stride;
2684a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *              outer_sum = inner_sum;
2694a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *          }
2704a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *      }
2714a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *  }
2724a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *  return new_width;
2739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org */
2744a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org
2759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.orgstatic int boxBlurInterp(const uint8_t* src, int src_y_stride, uint8_t* dst,
2769b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org                         int radius, int width, int height,
2779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org                         bool transpose, uint8_t outer_weight)
2789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org{
2799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int diameter = radius * 2;
2809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int kernelSize = diameter + 1;
2819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int border = SkMin32(width, diameter);
2829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int inner_weight = 255 - outer_weight;
2839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    outer_weight += outer_weight >> 7;
2849b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    inner_weight += inner_weight >> 7;
2859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    uint32_t outer_scale = (outer_weight << 16) / kernelSize;
2869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    uint32_t inner_scale = (inner_weight << 16) / (kernelSize - 2);
2874a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#ifndef SK_DISABLE_BLUR_ROUNDING
2884a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org    uint32_t half = 1 << 23;
2894a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#else
2904a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org    uint32_t half = 0;
2914a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#endif
2929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int new_width = width + diameter;
2939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int dst_x_stride = transpose ? height : 1;
2949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    int dst_y_stride = transpose ? 1 : new_width;
2959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    for (int y = 0; y < height; ++y) {
2964a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org        uint32_t outer_sum = 0, inner_sum = 0;
2979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        uint8_t* dptr = dst + y * dst_y_stride;
2989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        const uint8_t* right = src + y * src_y_stride;
2999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        const uint8_t* left = right;
3009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        int x = 0;
3019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
3029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define LEFT_BORDER_ITER \
3039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            inner_sum = outer_sum; \
3049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            outer_sum += *right++; \
3054a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org            *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; \
3069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            dptr += dst_x_stride;
3079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
3089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
3099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (;x < border - 16; x += 16) {
3109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3149b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3159b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3169b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3179b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3189b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3199b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3209b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3219b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3259b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3269b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
3279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
3289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
3299b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (;x < border; x++) {
3309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            LEFT_BORDER_ITER
3319b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
3329b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef LEFT_BORDER_ITER
3339b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (int x = width; x < diameter; ++x) {
3344a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org            *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24;
3359b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            dptr += dst_x_stride;
3369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
3379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = diameter;
3389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
3399b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define CENTER_ITER \
3409b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            inner_sum = outer_sum - *left; \
3419b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            outer_sum += *right++; \
3424a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org            *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; \
3439b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            dptr += dst_x_stride; \
3449b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            outer_sum -= *left++;
3459b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
3469b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
3479b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < width - 16; x += 16) {
3489b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3499b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3509b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3519b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3549b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3559b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3569b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
3659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
3669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < width; ++x) {
3679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            CENTER_ITER
3689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
3699b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef CENTER_ITER
3709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
3719b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        #define RIGHT_BORDER_ITER \
3729b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            inner_sum = outer_sum - *left++; \
3734a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org            *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; \
3749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            dptr += dst_x_stride; \
3759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            outer_sum = inner_sum;
3769b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
3779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        x = 0;
3789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS
3799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border - 16; x += 16) {
3809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3849b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
3969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
3979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif
3989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        for (; x < border; x++) {
3999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org            RIGHT_BORDER_ITER
4009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        }
4019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef RIGHT_BORDER_ITER
4029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org        SkASSERT(outer_sum == 0 && inner_sum == 0);
4039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    }
4049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org    return new_width;
4059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org}
4069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org
407c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.orgstatic void get_adjusted_radii(SkScalar passRadius, int *loRadius, int *hiRadius)
408c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org{
409c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org    *loRadius = *hiRadius = SkScalarCeil(passRadius);
410c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org    if (SkIntToScalar(*hiRadius) - passRadius > SkFloatToScalar(0.5f)) {
411c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org        *loRadius = *hiRadius - 1;
412c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org    }
413c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org}
414c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org
// Manually unrolling the integer blur kernel was measured at roughly a 15%
// speedup on Windows, break-even on Mac, and roughly a 15% slowdown on Linux,
// so the unrolled path is only switched on for Windows builds.
// Reading a word at a time when building the sum buffer gave no appreciable
// speedup on Windows or Mac, and a 2% slowdown on Linux.
#ifdef SK_BUILD_FOR_WIN32
#define UNROLL_KERNEL_LOOP 1
#endif
4228a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
4234560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com/** The sum buffer is an array of u32 to hold the accumulated sum of all of the
4244560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    src values at their position, plus all values above and to the left.
4254560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    When we sample into this buffer, we need an initial row and column of 0s,
4264560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    so we have an index correspondence as follows:
427fbfcd5602128ec010c82cb733c9cdc0a3254f9f3rmistry@google.com
4284560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    src[i, j] == sum[i+1, j+1]
4294560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    sum[0, j] == sum[i, 0] == 0
430fbfcd5602128ec010c82cb733c9cdc0a3254f9f3rmistry@google.com
4314560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    We assume that the sum buffer's stride == its width
4324560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com */
43303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.comstatic void build_sum_buffer(uint32_t sum[], int srcW, int srcH,
43403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                             const uint8_t src[], int srcRB) {
4354560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int sumW = srcW + 1;
4364560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com
4374560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    SkASSERT(srcRB >= srcW);
4388a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    // mod srcRB so we can apply it after each row
4394560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    srcRB -= srcW;
4408a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
4418a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int x, y;
4428a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
4434560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    // zero out the top row and column
4444560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    memset(sum, 0, sumW * sizeof(sum[0]));
4454560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    sum += sumW;
4464560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com
4478a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    // special case first row
4488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    uint32_t X = 0;
4494560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    *sum++ = 0; // initialze the first column to 0
45003016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com    for (x = srcW - 1; x >= 0; --x) {
4518a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        X = *src++ + X;
4524560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        *sum++ = X;
4538a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
4548a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    src += srcRB;
4558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
4568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    // now do the rest of the rows
45703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com    for (y = srcH - 1; y > 0; --y) {
4588a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        uint32_t L = 0;
4598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        uint32_t C = 0;
4604560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        *sum++ = 0; // initialze the first column to 0
46101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
46201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (x = srcW - 1; !SkIsAlign4((intptr_t) src) && x >= 0; x--) {
46301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t T = sum[-sumW];
46401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
46501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
46601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
46701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
46801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        }
46901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
47001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x >= 4; x-=4) {
47101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t T = sum[-sumW];
47201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
47301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
47401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
47501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
47601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            T = sum[-sumW];
47701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
47801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
47901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
48001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
48101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            T = sum[-sumW];
48201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
48301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
48401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
48501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
48601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            T = sum[-sumW];
48701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            X = *src++ + L + T - C;
48801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *sum++ = X;
48901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            L = X;
49001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            C = T;
49101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        }
49201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
49301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x >= 0; --x) {
4944560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com            uint32_t T = sum[-sumW];
4958a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            X = *src++ + L + T - C;
4964560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com            *sum++ = X;
4978a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            L = X;
4988a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            C = T;
4998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
5008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        src += srcRB;
5018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
5028a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
5038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
50403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/**
5058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * This is the path for apply_kernel() to be taken when the kernel
5068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * is wider than the source image.
5078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com */
5088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.comstatic void kernel_clamped(uint8_t dst[], int rx, int ry, const uint32_t sum[],
5098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           int sw, int sh) {
5108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    SkASSERT(2*rx > sw);
5118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    uint32_t scale = (1 << 24) / ((2*rx + 1)*(2*ry + 1));
5138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int sumStride = sw + 1;
5158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int dw = sw + 2*rx;
5178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int dh = sh + 2*ry;
5188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int prev_y = -2*ry;
5208caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int next_y = 1;
5218caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5228caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    for (int y = 0; y < dh; y++) {
5238caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int py = SkClampPos(prev_y) * sumStride;
5248caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int ny = SkFastMin32(next_y, sh) * sumStride;
5258caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int prev_x = -2*rx;
5278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int next_x = 1;
5288caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5298caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (int x = 0; x < dw; x++) {
5308caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = SkClampPos(prev_x);
5318caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = SkFastMin32(next_x, sw);
5328caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5338caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny];
5348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
5358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
5378caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
5388caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
5398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        prev_y += 1;
5418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        next_y += 1;
5428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    }
5438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com}
5448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com/**
54503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  sw and sh are the width and height of the src. Since the sum buffer
54603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  matches that, but has an extra row and col at the beginning (with zeros),
54703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  we can just use sw and sh as our "max" values for pinning coordinates
54803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  when sampling into sum[][]
5498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *
5508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *  The inner loop is conceptually simple; we break it into several sections
5518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *  to improve performance. Here's the original version:
5528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (int x = 0; x < dw; x++) {
5538caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = SkClampPos(prev_x);
5548caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = SkFastMin32(next_x, sw);
5558caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5568caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny];
5578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
5588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
5608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
5618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
56201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  The sections are:
56301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     left-hand section, where prev_x is clamped to 0
56401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     center section, where neither prev_x nor next_x is clamped
56501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     right-hand section, where next_x is clamped to sw
56601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  On some operating systems, the center section is unrolled for additional
56701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  speedup.
5688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com*/
5694560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.comstatic void apply_kernel(uint8_t dst[], int rx, int ry, const uint32_t sum[],
5704560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com                         int sw, int sh) {
5718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    if (2*rx > sw) {
5728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        kernel_clamped(dst, rx, ry, sum, sw, sh);
5738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        return;
5748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    }
5758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5768a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    uint32_t scale = (1 << 24) / ((2*rx + 1)*(2*ry + 1));
5778a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
5784560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int sumStride = sw + 1;
5798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
5808a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int dw = sw + 2*rx;
5818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int dh = sh + 2*ry;
5828a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
5834560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int prev_y = -2*ry;
5844560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int next_y = 1;
5858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
5868caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    SkASSERT(2*rx <= dw - 2*rx);
5878caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5884560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    for (int y = 0; y < dh; y++) {
5894560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int py = SkClampPos(prev_y) * sumStride;
5904560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int ny = SkFastMin32(next_y, sh) * sumStride;
5918a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
5924560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int prev_x = -2*rx;
5934560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int next_x = 1;
5948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int x = 0;
5958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
5968caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (; x < 2*rx; x++) {
5978caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x <= 0);
5988caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x <= sw);
5998caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6008caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = 0;
6018caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = next_x;
6028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny];
6048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
6058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
6078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
6088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
6098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
61001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i0 = prev_x + py;
61101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i1 = next_x + ny;
61201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i2 = next_x + py;
61301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i3 = prev_x + ny;
61401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
61501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#if UNROLL_KERNEL_LOOP
61601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x < dw - 2*rx - 4; x += 4) {
6178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x >= 0);
6188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x <= sw);
6198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
62001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
62101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
62201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
62301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
62401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
62501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
62601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
62701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
6288caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
62901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            prev_x += 4;
63001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            next_x += 4;
63101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        }
63201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif
63301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
63401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x < dw - 2*rx; x++) {
63501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            SkASSERT(prev_x >= 0);
63601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            SkASSERT(next_x <= sw);
63701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
63801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
6398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
6408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
6428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
6438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
6448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6458caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (; x < dw; x++) {
6468caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x >= 0);
6478caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x > sw);
6488caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = prev_x;
6508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = sw;
6518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny];
6538caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8(tmp * scale >> 24);
6548caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6558caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
6568caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
6578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
6588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        prev_y += 1;
6608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        next_y += 1;
6618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    }
6628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com}
6638caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com/**
6658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * This is the path for apply_kernel_interp() to be taken when the kernel
6668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * is wider than the source image.
6678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com */
6688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.comstatic void kernel_interp_clamped(uint8_t dst[], int rx, int ry,
6698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                const uint32_t sum[], int sw, int sh, U8CPU outer_weight) {
6708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    SkASSERT(2*rx > sw);
6718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int inner_weight = 255 - outer_weight;
6738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    // round these guys up if they're bigger than 127
6758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    outer_weight += outer_weight >> 7;
6768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    inner_weight += inner_weight >> 7;
6778caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6788caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    uint32_t outer_scale = (outer_weight << 16) / ((2*rx + 1)*(2*ry + 1));
6798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    uint32_t inner_scale = (inner_weight << 16) / ((2*rx - 1)*(2*ry - 1));
6808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int sumStride = sw + 1;
6828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int dw = sw + 2*rx;
6848caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int dh = sh + 2*ry;
6858caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6868caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int prev_y = -2*ry;
6878caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    int next_y = 1;
6888caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6898caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    for (int y = 0; y < dh; y++) {
6908caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int py = SkClampPos(prev_y) * sumStride;
6918caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int ny = SkFastMin32(next_y, sh) * sumStride;
6928caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6938caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int ipy = SkClampPos(prev_y + 1) * sumStride;
6948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int iny = SkClampMax(next_y - 1, sh) * sumStride;
6958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
6968caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int prev_x = -2*rx;
6978caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int next_x = 1;
6988a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
6994560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        for (int x = 0; x < dw; x++) {
7008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            int px = SkClampPos(prev_x);
7018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            int nx = SkFastMin32(next_x, sw);
7028a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int ipx = SkClampPos(prev_x + 1);
7048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int inx = SkClampMax(next_x - 1, sw);
7058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t outer_sum = sum[px+py] + sum[nx+ny]
7078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[nx+py] - sum[px+ny];
7088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny]
7098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[inx+ipy] - sum[ipx+iny];
7108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
7118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
7128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7138a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            prev_x += 1;
7148a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            next_x += 1;
7158a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
7168a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        prev_y += 1;
7178a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        next_y += 1;
7188a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
7198a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
7208a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
72103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/**
72203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  sw and sh are the width and height of the src. Since the sum buffer
72303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  matches that, but has an extra row and col at the beginning (with zeros),
72403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  we can just use sw and sh as our "max" values for pinning coordinates
72503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com *  when sampling into sum[][]
7268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *
7278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *  The inner loop is conceptually simple; we break it into several variants
7288caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *  to improve performance. Here's the original version:
7298caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (int x = 0; x < dw; x++) {
7308caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = SkClampPos(prev_x);
7318caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = SkFastMin32(next_x, sw);
7328caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7338caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int ipx = SkClampPos(prev_x + 1);
7348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int inx = SkClampMax(next_x - 1, sw);
7358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t outer_sum = sum[px+py] + sum[nx+ny]
7378caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[nx+py] - sum[px+ny];
7388caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny]
7398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[inx+ipy] - sum[ipx+iny];
7408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
7418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
7428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
7448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
7458caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
74601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  The sections are:
74701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     left-hand section, where prev_x is clamped to 0
74801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     center section, where neither prev_x nor next_x is clamped
74901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *     right-hand section, where next_x is clamped to sw
75001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  On some operating systems, the center section is unrolled for additional
75101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *  speedup.
7528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com*/
7534560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.comstatic void apply_kernel_interp(uint8_t dst[], int rx, int ry,
7544560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com                const uint32_t sum[], int sw, int sh, U8CPU outer_weight) {
7558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkASSERT(rx > 0 && ry > 0);
7568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkASSERT(outer_weight <= 255);
7578a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    if (2*rx > sw) {
7598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        kernel_interp_clamped(dst, rx, ry, sum, sw, sh, outer_weight);
7608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        return;
7618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    }
7628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7638a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int inner_weight = 255 - outer_weight;
7648a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7658a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    // round these guys up if they're bigger than 127
7668a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    outer_weight += outer_weight >> 7;
7678a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    inner_weight += inner_weight >> 7;
7688a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7698a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    uint32_t outer_scale = (outer_weight << 16) / ((2*rx + 1)*(2*ry + 1));
7708a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    uint32_t inner_scale = (inner_weight << 16) / ((2*rx - 1)*(2*ry - 1));
7718a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7724560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int sumStride = sw + 1;
7738a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7748a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int dw = sw + 2*rx;
7758a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int dh = sh + 2*ry;
7768a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7774560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int prev_y = -2*ry;
7784560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    int next_y = 1;
7798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com    SkASSERT(2*rx <= dw - 2*rx);
7818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
7824560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com    for (int y = 0; y < dh; y++) {
7834560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int py = SkClampPos(prev_y) * sumStride;
7844560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int ny = SkFastMin32(next_y, sh) * sumStride;
7858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7864560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int ipy = SkClampPos(prev_y + 1) * sumStride;
7874560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int iny = SkClampMax(next_y - 1, sh) * sumStride;
7888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7894560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int prev_x = -2*rx;
7904560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com        int next_x = 1;
7918caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        int x = 0;
7928a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7938caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (; x < 2*rx; x++) {
7948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x < 0);
7958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x <= sw);
7968a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
7978caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = 0;
7988caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = next_x;
7998caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8008caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int ipx = 0;
8018caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int inx = next_x - 1;
8028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t outer_sum = sum[px+py] + sum[nx+ny]
8048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[nx+py] - sum[px+ny];
8058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny]
8068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[inx+ipy] - sum[ipx+iny];
8078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
8088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
8098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
8118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
8128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
8138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
81401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i0 = prev_x + py;
81501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i1 = next_x + ny;
81601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i2 = next_x + py;
81701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i3 = prev_x + ny;
81801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i4 = prev_x + 1 + ipy;
81901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i5 = next_x - 1 + iny;
82001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i6 = next_x - 1 + ipy;
82101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        int i7 = prev_x + 1 + iny;
82201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
82301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#if UNROLL_KERNEL_LOOP
82401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x < dw - 2*rx - 4; x += 4) {
8258caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x >= 0);
8268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x <= sw);
8278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
82801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
82901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
83001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
83101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
83201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
83301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
83401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
83501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
83601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
83701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
83801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
83901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
84001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
84101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
84201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
84301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
8448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
84501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            prev_x += 4;
84601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            next_x += 4;
84701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        }
84801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif
8498a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
85001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com        for (; x < dw - 2*rx; x++) {
85101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            SkASSERT(prev_x >= 0);
85201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            SkASSERT(next_x <= sw);
85301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com
85401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++];
85501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com            uint32_t inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++];
8568caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
8578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
8588a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            prev_x += 1;
8608a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            next_x += 1;
8618a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
8628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8638caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        for (; x < dw; x++) {
8648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(prev_x >= 0);
8658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            SkASSERT(next_x > sw);
8668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int px = prev_x;
8688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int nx = sw;
8698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int ipx = prev_x + 1;
8718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            int inx = sw;
8728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t outer_sum = sum[px+py] + sum[nx+ny]
8748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[nx+py] - sum[px+ny];
8758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny]
8768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                               - sum[inx+ipy] - sum[ipx+iny];
8778caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            *dst++ = SkToU8((outer_sum * outer_scale
8788caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com                           + inner_sum * inner_scale) >> 24);
8798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            prev_x += 1;
8818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com            next_x += 1;
8828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com        }
8838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com
8848a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        prev_y += 1;
8858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        next_y += 1;
8868a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
8878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
8888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8898a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkColorPriv.h"
8908a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
8910e3c664250f561ec9f7107b92136517a72d03afdreed@android.comstatic void merge_src_with_blur(uint8_t dst[], int dstRB,
8920e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                                const uint8_t src[], int srcRB,
8930e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                                const uint8_t blur[], int blurRB,
8940e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                                int sw, int sh) {
8950e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    dstRB -= sw;
8960e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    srcRB -= sw;
8970e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    blurRB -= sw;
8980e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    while (--sh >= 0) {
8990e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        for (int x = sw - 1; x >= 0; --x) {
9008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            *dst = SkToU8(SkAlphaMul(*blur, SkAlpha255To256(*src)));
9018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            dst += 1;
9028a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            src += 1;
9038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            blur += 1;
9048a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
9050e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        dst += dstRB;
9060e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        src += srcRB;
9070e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        blur += blurRB;
9088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
9098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
9108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9118a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.comstatic void clamp_with_orig(uint8_t dst[], int dstRowBytes,
9120e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                            const uint8_t src[], int srcRowBytes,
9130e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                            int sw, int sh,
9144560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com                            SkBlurMask::Style style) {
9158a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int x;
9160e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    while (--sh >= 0) {
9178a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        switch (style) {
9188a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        case SkBlurMask::kSolid_Style:
9190e3c664250f561ec9f7107b92136517a72d03afdreed@android.com            for (x = sw - 1; x >= 0; --x) {
9200e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                int s = *src;
9210e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                int d = *dst;
9220e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                *dst = SkToU8(s + d - SkMulDiv255Round(s, d));
9238a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                dst += 1;
9248a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                src += 1;
9258a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            }
9268a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            break;
9278a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        case SkBlurMask::kOuter_Style:
9280e3c664250f561ec9f7107b92136517a72d03afdreed@android.com            for (x = sw - 1; x >= 0; --x) {
9290e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                if (*src) {
9308a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                    *dst = SkToU8(SkAlphaMul(*dst, SkAlpha255To256(255 - *src)));
9310e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                }
9328a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                dst += 1;
9338a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                src += 1;
9348a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            }
9358a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            break;
9368a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        default:
9370c00f21fee3f5cfa3aa7e5d46ff94cb8cf340451tomhudson@google.com            SkDEBUGFAIL("Unexpected blur style here");
9388a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            break;
9398a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
9408a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        dst += dstRowBytes - sw;
9410e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        src += srcRowBytes - sw;
9428a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
9438a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
9448a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
94503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com///////////////////////////////////////////////////////////////////////////////
9468a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
94733cdbdea3ddcec9323b65eace86e10557312ae9bbsalomon@google.com// we use a local function to wrap the class static method to work around
9488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com// a bug in gcc98
9498a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.comvoid SkMask_FreeImage(uint8_t* image);
95003016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.comvoid SkMask_FreeImage(uint8_t* image) {
9518a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkMask::FreeImage(image);
9528a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
9538a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9548a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.combool SkBlurMask::Blur(SkMask* dst, const SkMask& src,
9555af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com                      SkScalar radius, Style style, Quality quality,
95671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                      SkIPoint* margin, bool separable)
9575af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com{
95803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com    if (src.fFormat != SkMask::kA8_Format) {
9598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        return false;
96003016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com    }
9618a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9624868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    // Force high quality off for small radii (performance)
96391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org    if (radius < SkIntToScalar(3)) {
96491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org        quality = kLow_Quality;
96591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org    }
9664868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org
9674868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    // highQuality: use three box blur passes as a cheap way to approximate a Gaussian blur
96891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org    int passCount = (kHigh_Quality == quality) ? 3 : 1;
9697c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    SkScalar passRadius = (kHigh_Quality == quality) ? SkScalarMul( radius, kBlurRadiusFudgeFactor): radius;
9704868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org
9714868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    int rx = SkScalarCeil(passRadius);
9724868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    int outer_weight = 255 - SkScalarRound((SkIntToScalar(rx) - passRadius) * 255);
9738a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9748a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkASSERT(rx >= 0);
9758a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    SkASSERT((unsigned)outer_weight <= 255);
9760e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    if (rx <= 0) {
9778a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        return false;
9780e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    }
9798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9808a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    int ry = rx;    // only do square blur for now
9818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9824868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    int padx = passCount * rx;
9834868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    int pady = passCount * ry;
9845af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com    if (margin) {
9855af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com        margin->set(padx, pady);
9865af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com    }
9874868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org    dst->fBounds.set(src.fBounds.fLeft - padx, src.fBounds.fTop - pady,
9884868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org        src.fBounds.fRight + padx, src.fBounds.fBottom + pady);
98949f0ff25a046d6001dc2d095b6fa3c30f0f46b6areed@android.com    dst->fRowBytes = dst->fBounds.width();
9908a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    dst->fFormat = SkMask::kA8_Format;
9918a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    dst->fImage = NULL;
9928a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
9930e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    if (src.fImage) {
994543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com        size_t dstSize = dst->computeImageSize();
995543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com        if (0 == dstSize) {
996543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            return false;   // too big to allocate, abort
997543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com        }
998543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com
9998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        int             sw = src.fBounds.width();
10008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        int             sh = src.fBounds.height();
10018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        const uint8_t*  sp = src.fImage;
1002543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com        uint8_t*        dp = SkMask::AllocImage(dstSize);
10038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
10048a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        SkAutoTCallVProc<uint8_t, SkMask_FreeImage> autoCall(dp);
10058a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
10068a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        // build the blurry destination
100771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        if (separable) {
100871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org            SkAutoTMalloc<uint8_t>  tmpBuffer(dstSize);
100971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org            uint8_t*                tp = tmpBuffer.get();
101071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org            int w = sw, h = sh;
101171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org
101291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org            if (outer_weight == 255) {
1013c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org                int loRadius, hiRadius;
1014c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org                get_adjusted_radii(passRadius, &loRadius, &hiRadius);
101591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                if (kHigh_Quality == quality) {
101691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    // Do three X blurs, with a transpose on the final one.
101791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlur(sp, src.fRowBytes, tp, loRadius, hiRadius, w, h, false);
101891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlur(tp, w,             dp, hiRadius, loRadius, w, h, false);
101991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlur(dp, w,             tp, hiRadius, hiRadius, w, h, true);
102091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    // Do three Y blurs, with a transpose on the final one.
102191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlur(tp, h,             dp, loRadius, hiRadius, h, w, false);
102291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlur(dp, h,             tp, hiRadius, loRadius, h, w, false);
102391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlur(tp, h,             dp, hiRadius, hiRadius, h, w, true);
102491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                } else {
102591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlur(sp, src.fRowBytes, tp, rx, rx, w, h, true);
102691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlur(tp, h,             dp, ry, ry, h, w, true);
102791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                }
1028908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org            } else {
102991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                if (kHigh_Quality == quality) {
103091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    // Do three X blurs, with a transpose on the final one.
103191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlurInterp(sp, src.fRowBytes, tp, rx, w, h, false, outer_weight);
103291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlurInterp(tp, w,             dp, rx, w, h, false, outer_weight);
103391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlurInterp(dp, w,             tp, rx, w, h, true, outer_weight);
103491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    // Do three Y blurs, with a transpose on the final one.
103591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlurInterp(tp, h,             dp, ry, h, w, false, outer_weight);
103691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlurInterp(dp, h,             tp, ry, h, w, false, outer_weight);
103791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlurInterp(tp, h,             dp, ry, h, w, true, outer_weight);
103891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                } else {
103991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    w = boxBlurInterp(sp, src.fRowBytes, tp, rx, w, h, true, outer_weight);
104091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                    h = boxBlurInterp(tp, h,             dp, ry, h, w, true, outer_weight);
104191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org                }
104271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org            }
104371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org        } else {
104403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            const size_t storageW = sw + 2 * (passCount - 1) * rx + 1;
104503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            const size_t storageH = sh + 2 * (passCount - 1) * ry + 1;
104603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            SkAutoTMalloc<uint32_t> storage(storageW * storageH);
10478a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            uint32_t*               sumBuffer = storage.get();
10488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
10494868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org            //pass1: sp is source, dp is destination
10508a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            build_sum_buffer(sumBuffer, sw, sh, sp, src.fRowBytes);
105103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            if (outer_weight == 255) {
10528a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                apply_kernel(dp, rx, ry, sumBuffer, sw, sh);
105303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            } else {
10548a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com                apply_kernel_interp(dp, rx, ry, sumBuffer, sw, sh, outer_weight);
105503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            }
10564868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org
105791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org            if (kHigh_Quality == quality) {
10584868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                //pass2: dp is source, tmpBuffer is destination
10594868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                int tmp_sw = sw + 2 * rx;
10604868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                int tmp_sh = sh + 2 * ry;
10614868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                SkAutoTMalloc<uint8_t>  tmpBuffer(dstSize);
10624868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                build_sum_buffer(sumBuffer, tmp_sw, tmp_sh, dp, tmp_sw);
10634868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                if (outer_weight == 255)
10644868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                    apply_kernel(tmpBuffer.get(), rx, ry, sumBuffer, tmp_sw, tmp_sh);
10654868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                else
106603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                    apply_kernel_interp(tmpBuffer.get(), rx, ry, sumBuffer,
106703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                                        tmp_sw, tmp_sh, outer_weight);
10684868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org
10694868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                //pass3: tmpBuffer is source, dp is destination
10704868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                tmp_sw += 2 * rx;
10714868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                tmp_sh += 2 * ry;
10724868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                build_sum_buffer(sumBuffer, tmp_sw, tmp_sh, tmpBuffer.get(), tmp_sw);
10734868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                if (outer_weight == 255)
10744868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                    apply_kernel(dp, rx, ry, sumBuffer, tmp_sw, tmp_sh);
10754868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org                else
107603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                    apply_kernel_interp(dp, rx, ry, sumBuffer, tmp_sw, tmp_sh,
107703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                                        outer_weight);
10784868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org            }
10798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
10808a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
10818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        dst->fImage = dp;
10828a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        // if need be, alloc the "real" dst (same size as src) and copy/merge
10838a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        // the blur into it (applying the src)
10840e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        if (style == kInner_Style) {
10850e3c664250f561ec9f7107b92136517a72d03afdreed@android.com            // now we allocate the "real" dst, mirror the size of src
1086543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            size_t srcSize = src.computeImageSize();
1087543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            if (0 == srcSize) {
1088543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com                return false;   // too big to allocate, abort
1089543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            }
1090543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com            dst->fImage = SkMask::AllocImage(srcSize);
10910e3c664250f561ec9f7107b92136517a72d03afdreed@android.com            merge_src_with_blur(dst->fImage, src.fRowBytes,
10920e3c664250f561ec9f7107b92136517a72d03afdreed@android.com                                sp, src.fRowBytes,
109303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                                dp + passCount * (rx + ry * dst->fRowBytes),
109403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                                dst->fRowBytes, sw, sh);
10958a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com            SkMask::FreeImage(dp);
10960e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        } else if (style != kNormal_Style) {
109703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com            clamp_with_orig(dp + passCount * (rx + ry * dst->fRowBytes),
109803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com                            dst->fRowBytes, sp, src.fRowBytes, sw, sh, style);
10998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        }
11008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        (void)autoCall.detach();
11018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
11028a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
11030e3c664250f561ec9f7107b92136517a72d03afdreed@android.com    if (style == kInner_Style) {
11048a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com        dst->fBounds = src.fBounds; // restore trimmed bounds
11050e3c664250f561ec9f7107b92136517a72d03afdreed@android.com        dst->fRowBytes = src.fRowBytes;
11068a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    }
11078a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
11088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com    return true;
11098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com}
11108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com
111171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.orgbool SkBlurMask::BlurSeparable(SkMask* dst, const SkMask& src,
111271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                               SkScalar radius, Style style, Quality quality,
111371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                               SkIPoint* margin)
111471f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{
111571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    return SkBlurMask::Blur(dst, src, radius, style, quality, margin, true);
111671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org}
111771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org
111871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.orgbool SkBlurMask::Blur(SkMask* dst, const SkMask& src,
111971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                     SkScalar radius, Style style, Quality quality,
112071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org                     SkIPoint* margin)
112171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{
112271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org    return SkBlurMask::Blur(dst, src, radius, style, quality, margin, false);
112371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org}
11247c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
/* Convolving a box with itself three times results in a piecewise
   quadratic function:

   0                               x <= -1.5
   9/8 + 3/2 x + 1/2 x^2    -1.5 < x <= -0.5
   3/4 - x^2                -0.5 < x <=  0.5
   9/8 - 3/2 x + 1/2 x^2     0.5 < x <=  1.5
   0                         1.5 < x

   To get the profile curve of the blurred step function at the rectangle
   edge, we evaluate the indefinite integral, which is piecewise cubic
   (the constants are chosen so the pieces join continuously and the
   curve runs from 0 to 1):

   0                                         x <= -1.5
   9/16 + 9/8 x + 3/4 x^2 + 1/6 x^3   -1.5 < x <= -0.5
   1/2  + 3/4 x - 1/3 x^3             -0.5 < x <=  0.5
   7/16 + 9/8 x - 3/4 x^2 + 1/6 x^3    0.5 < x <=  1.5
   1                                   1.5 < x
*/
11437c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
/*
    Evaluates a piecewise-cubic falloff curve at x.

    Returns exactly 0 for x > 1.5 and exactly 1 for x < -1.5.  In between
    it evaluates one of three cubic pieces (selected at x = 0.5 and
    x = -0.5), giving 0.5 at x = 0.  Larger x therefore yields a smaller
    result.
*/
static float gaussian_integral( float x ) {
    // Outside [-1.5, 1.5] the curve is constant.
    if ( x > 1.5f ) {
        return 0.0f;
    }
    if ( x < -1.5f ) {
        return 1.0f;
    }

    const float xSquared = x*x;
    const float xCubed = xSquared*x;

    float result;
    if ( x > 0.5f ) {
        // upper piece: 0.5 < x <= 1.5
        result = 0.5625f - ( xCubed / 6.0f - 3.0f * xSquared * 0.25f + 1.125f * x);
    } else if ( x > -0.5f ) {
        // middle piece: -0.5 < x <= 0.5
        result = 0.5f - (0.75f * x - xCubed / 3.0f);
    } else {
        // lower piece: -1.5 <= x <= -0.5
        result = 0.4375f + (-xCubed / 6.0f - 3.0f * xSquared * 0.25f - 1.125f * x);
    }
    return result;
}
11637c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11648ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com/*
11657c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    compute_profile allocates and fills in an array of floating
11668ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com    point values between 0 and 255 for the profile signature of
11677c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    a blurred half-plane with the given blur radius.  Since we're
11687c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    going to be doing screened multiplications (i.e., 1 - (1-x)(1-y))
11697c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    all the time, we actually fill in the profile pre-inverted
11707c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    (already done 255-x).
11718ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
11727c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    The function returns the size of the array allocated for the
11738ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com    profile.  It's the responsibility of the caller to delete the
11747c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    memory returned in profile_out.
11757c7292c6071898d73dc935c3b66b9816183806f0humper@google.com*/
11767c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11777c7292c6071898d73dc935c3b66b9816183806f0humper@google.comstatic int compute_profile( SkScalar radius, unsigned int **profile_out ) {
11789c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com    int size = SkScalarFloorToInt(radius * 3 + 1);
11797c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int center = size >> 1;
11807c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
118133cdbdea3ddcec9323b65eace86e10557312ae9bbsalomon@google.com    unsigned int *profile = SkNEW_ARRAY(unsigned int, size);
11827c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11837c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    float invr = 1.0f/radius;
11847c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11857c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    profile[0] = 255;
11867c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    for (int x = 1 ; x < size ; x++) {
11877c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        float scaled_x = ( center - x ) * invr;
11887c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        float gi = gaussian_integral( scaled_x );
11897c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        profile[x] = 255 - (uint8_t) ( 255.f * gi );
11907c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    }
11917c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11927c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    *profile_out = profile;
11937c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    return size;
11947c7292c6071898d73dc935c3b66b9816183806f0humper@google.com}
11957c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
11968ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// TODO MAYBE: Maintain a profile cache to avoid recomputing this for
11977c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// commonly used radii.  Consider baking some of the most common blur radii
11987c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// directly in as static data?
11997c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
12007c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// Implementation adapted from Michael Herf's approach:
12017c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// http://stereopsis.com/shadowrect/
12027c7292c6071898d73dc935c3b66b9816183806f0humper@google.com
12037c7292c6071898d73dc935c3b66b9816183806f0humper@google.combool SkBlurMask::BlurRect(SkMask *dst, const SkRect &src,
12047c7292c6071898d73dc935c3b66b9816183806f0humper@google.com                          SkScalar provided_radius, Style style, Quality quality,
12057c7292c6071898d73dc935c3b66b9816183806f0humper@google.com                          SkIPoint *margin) {
12067c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int profile_size;
12077c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    unsigned int *profile;
12088ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12098ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12107c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    float radius = SkScalarToFloat( SkScalarMul( provided_radius, kBlurRadiusFudgeFactor ) );
12118ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12127c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    profile_size = compute_profile( radius, &profile );
121333cdbdea3ddcec9323b65eace86e10557312ae9bbsalomon@google.com    SkAutoTDeleteArray<unsigned int> ada(profile);
12148ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12157c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int pad = (int) (radius * 1.5f + 1);
12167c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    if (margin) {
12177c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        margin->set( pad, pad );
12187c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    }
12199c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com    dst->fBounds = SkIRect::MakeWH(SkScalarFloorToInt(src.width()), SkScalarFloorToInt(src.height()));
12207c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fBounds.outset(pad, pad);
12218ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12227c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fRowBytes = dst->fBounds.width();
12237c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fFormat = SkMask::kA8_Format;
12247c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fImage = NULL;
12258ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12267c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    size_t dstSize = dst->computeImageSize();
12277c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    if (0 == dstSize) {
12287c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        return false;   // too big to allocate, abort
12297c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    }
12308ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12319c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com    int             sw = SkScalarFloorToInt(src.width());
12329c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com    int             sh = SkScalarFloorToInt(src.height());
12338ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12347c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    uint8_t*        dp = SkMask::AllocImage(dstSize);
12358ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12367c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    dst->fImage = dp;
12378ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12387c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int dst_height = dst->fBounds.height();
12397c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int dst_width = dst->fBounds.width();
12408ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12417c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    // nearest odd number less than the profile size represents the center
12427c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    // of the (2x scaled) profile
12437c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int center = ( profile_size & ~1 ) - 1;
12448ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12457c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int w = sw - center;
12467c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    int h = sh - center;
12478ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12487c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    uint8_t *outptr = dp;
12498ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12507c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    for (int y = 0 ; y < dst_height ; y++)
12517c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    {
12527c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        // time to fill in a scanline of the blurry rectangle.
12537c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        // to avoid floating point math, everything is multiplied by
12547c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        // 2 where needed.  This keeps things nice and integer-oriented.
12558ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12567c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        int dy = abs((y << 1) - dst_height) - h; // how far are we from the original edge?
12577c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        int oy = dy >> 1;
12587c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        if (oy < 0) oy = 0;
12598ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12607c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        unsigned int profile_y = profile[oy];
12618ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12627c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        for (int x = 0 ; x < (dst_width << 1) ; x += 2) {
12637c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            int dx = abs( x - dst_width ) - w;
12647c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            int ox = dx >> 1;
12657c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            if (ox < 0) ox = 0;
12668ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12677c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            unsigned int maskval = SkMulDiv255Round(profile[ox], profile_y);
12688ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12697c7292c6071898d73dc935c3b66b9816183806f0humper@google.com            *(outptr++) = maskval;
12707c7292c6071898d73dc935c3b66b9816183806f0humper@google.com        }
12717c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    }
12728ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com
12737c7292c6071898d73dc935c3b66b9816183806f0humper@google.com    return true;
12747c7292c6071898d73dc935c3b66b9816183806f0humper@google.com}
1275