SkBlurMask.cpp revision 9c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254
1ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com 2ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com/* 3ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * Copyright 2006 The Android Open Source Project 4ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * 5ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * Use of this source code is governed by a BSD-style license that can be 6ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * found in the LICENSE file. 7ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com */ 8ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com 98a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkBlurMask.h" 11889bd8bd7f604acae0a6303365bc82c06da1e6f3tomhudson@google.com#include "SkMath.h" 128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkTemplates.h" 1301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#include "SkEndian.h" 1401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 158ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// scale factor for the blur radius to match the behavior of the all existing blur 167c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// code (both on the CPU and the GPU). This magic constant is 1/sqrt(3). 177c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 188ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// TODO: get rid of this fudge factor and move any required fudging up into 197c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// the calling library 207c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 217c7292c6071898d73dc935c3b66b9816183806f0humper@google.com#define kBlurRadiusFudgeFactor SkFloatToScalar( .57735f ) 227c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define UNROLL_SEPARABLE_LOOPS 249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 25908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org/** 26908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * This function performs a box blur in X, of the given radius. If the 27884e60be30e20f38b3466a4697081187d2f1f814skia.committer@gmail.com * "transpose" parameter is true, it will transpose the pixels on write, 28908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * such that X and Y are swapped. Reads are always performed from contiguous 29908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * memory in X, for speed. The destination buffer (dst) must be at least 309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * (width + leftRadius + rightRadius) * height bytes in size. 31908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org */ 32908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.orgstatic int boxBlur(const uint8_t* src, int src_y_stride, uint8_t* dst, 33c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org int leftRadius, int rightRadius, int width, int height, 34c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org bool transpose) 3571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{ 369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int diameter = leftRadius + rightRadius; 379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int kernelSize = diameter + 1; 389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int border = SkMin32(width, diameter); 3971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org uint32_t scale = (1 << 24) / kernelSize; 40c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org int new_width = width + SkMax32(leftRadius, rightRadius) * 2; 41908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org int dst_x_stride = transpose ? height : 1; 42908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org int dst_y_stride = transpose ? 1 : new_width; 4371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org for (int y = 0; y < height; ++y) { 4471f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org int sum = 0; 45908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org uint8_t* dptr = dst + y * dst_y_stride; 46908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org const uint8_t* right = src + y * src_y_stride; 47908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org const uint8_t* left = right; 48336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org for (int x = 0; x < rightRadius - leftRadius; x++) { 49336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org *dptr = 0; 50336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org dptr += dst_x_stride; 51c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org } 529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define LEFT_BORDER_ITER \ 539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org sum += *right++; \ 549b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *dptr = (sum * scale) >> 24; \ 55908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org dptr += dst_x_stride; 569b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int x = 0; 589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border - 16; x += 16) { 609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 699b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 719b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 729b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 7671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border; ++x) { 799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef LEFT_BORDER_ITER 829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define TRIVIAL_ITER \ 839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *dptr = (sum * scale) >> 24; \ 84908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org dptr += dst_x_stride; 859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = width; 869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < diameter - 16; x += 16) { 889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 1059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 1069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < diameter; ++x) { 1079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 10871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 1099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef TRIVIAL_ITER 1109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define CENTER_ITER \ 1119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org sum += *right++; \ 1129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *dptr = (sum * scale) >> 24; \ 1139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org sum -= *left++; \ 114908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org dptr += dst_x_stride; 1159b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 1169b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = diameter; 1179b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 1189b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < width - 16; x += 16) { 1199b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1209b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1219b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1259b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1269b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1299b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1319b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1329b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1339b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1349b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1359b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 1369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 1379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < width; ++x) { 1389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 13971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 1409b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef CENTER_ITER 1419b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define RIGHT_BORDER_ITER \ 1429b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *dptr = (sum * scale) >> 24; \ 1439b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org sum -= *left++; \ 144908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org dptr += dst_x_stride; 1459b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 1469b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = 0; 1479b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 1489b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border - 16; x += 16) { 1499b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1509b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1519b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1549b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1559b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1569b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 1669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 1679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border; ++x) { 1689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 16971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 1709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef RIGHT_BORDER_ITER 171336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org for (int x = 0; x < leftRadius - rightRadius; x++) { 172336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org *dptr = 0; 173336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org dptr += dst_x_stride; 174c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org } 17571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkASSERT(sum == 0); 17671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 177908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org return new_width; 17871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org} 17971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org 1809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org/** 1819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * This variant of the box blur handles blurring of non-integer radii. It 1829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * keeps two running sums: an outer sum for the rounded-up kernel radius, and 1839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * an inner sum for the rounded-down kernel radius. For each pixel, it linearly 1849b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * interpolates between them. In float this would be: 1859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * outer_weight * outer_sum / kernelSize + 1869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * (1.0 - outer_weight) * innerSum / (kernelSize - 2) 1879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org */ 1889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.orgstatic int boxBlurInterp(const uint8_t* src, int src_y_stride, uint8_t* dst, 1899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int radius, int width, int height, 1909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org bool transpose, uint8_t outer_weight) 1919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org{ 1929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int diameter = radius * 2; 1939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int kernelSize = diameter + 1; 1949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int border = SkMin32(width, diameter); 1959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int inner_weight = 255 - outer_weight; 1969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_weight += outer_weight >> 7; 1979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org inner_weight += inner_weight >> 7; 1989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org uint32_t outer_scale = (outer_weight << 16) / kernelSize; 1999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org uint32_t inner_scale = (inner_weight << 16) / (kernelSize - 2); 2009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int new_width = width + diameter; 2019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int dst_x_stride = transpose ? height : 1; 2029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int dst_y_stride = transpose ? 1 : new_width; 2039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (int y = 0; y < height; ++y) { 2049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int outer_sum = 0, inner_sum = 0; 2059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org uint8_t* dptr = dst + y * dst_y_stride; 2069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org const uint8_t* right = src + y * src_y_stride; 2079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org const uint8_t* left = right; 2089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int x = 0; 2099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 2109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define LEFT_BORDER_ITER \ 2119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org inner_sum = outer_sum; \ 2129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_sum += *right++; \ 2139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *dptr = (outer_sum * outer_scale + inner_sum * inner_scale) >> 24; \ 2149b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org dptr += dst_x_stride; 2159b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 2169b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 2179b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (;x < border - 16; x += 16) { 2189b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2199b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2209b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2219b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2259b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2269b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2299b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2319b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2329b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2339b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2349b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 2359b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 2369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 2379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (;x < border; x++) { 2389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 2399b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 2409b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef LEFT_BORDER_ITER 2419b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (int x = width; x < diameter; ++x) { 2429b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *dptr = (outer_sum * outer_scale + inner_sum * inner_scale) >> 24; 2439b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org dptr += dst_x_stride; 2449b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 2459b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = diameter; 2469b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 2479b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define CENTER_ITER \ 2489b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org inner_sum = outer_sum - *left; \ 2499b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_sum += *right++; \ 2509b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *dptr = (outer_sum * outer_scale + inner_sum * inner_scale) >> 24; \ 2519b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org dptr += dst_x_stride; \ 2529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_sum -= *left++; 2539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 2549b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 2559b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < width - 16; x += 16) { 2569b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2699b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2719b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2729b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 2739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 2749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < width; ++x) { 2759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 2769b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 2779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef CENTER_ITER 2789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 2799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org #define RIGHT_BORDER_ITER \ 2809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org inner_sum = outer_sum - *left++; \ 2819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org *dptr = (outer_sum * outer_scale + inner_sum * inner_scale) >> 24; \ 2829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org dptr += dst_x_stride; \ 2839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_sum = inner_sum; 2849b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 2859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = 0; 2869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 2879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border - 16; x += 16) { 2889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 3069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border; x++) { 3079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef RIGHT_BORDER_ITER 3109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org SkASSERT(outer_sum == 0 && inner_sum == 0); 3119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org return new_width; 3139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org} 3149b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 315c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.orgstatic void get_adjusted_radii(SkScalar passRadius, int *loRadius, int *hiRadius) 316c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org{ 317c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org *loRadius = *hiRadius = SkScalarCeil(passRadius); 318c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org if (SkIntToScalar(*hiRadius) - passRadius > SkFloatToScalar(0.5f)) { 319c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org *loRadius = *hiRadius - 1; 320c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org } 321c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org} 322c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org 32301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com// Unrolling the integer blur kernel seems to give us a ~15% speedup on Windows, 32401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com// breakeven on Mac, and ~15% slowdown on Linux. 32501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com// Reading a word at a time when bulding the sum buffer seems to give 32601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com// us no appreciable speedup on Windows or Mac, and 2% slowdown on Linux. 327054ff1efa4f9187ce7fd20aaf3aed7cecf14e12btomhudson@google.com#if defined(SK_BUILD_FOR_WIN32) 32801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#define UNROLL_KERNEL_LOOP 1 32901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif 3308a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 3314560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com/** The sum buffer is an array of u32 to hold the accumulated sum of all of the 3324560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com src values at their position, plus all values above and to the left. 3334560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com When we sample into this buffer, we need an initial row and column of 0s, 3344560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com so we have an index correspondence as follows: 335fbfcd5602128ec010c82cb733c9cdc0a3254f9f3rmistry@google.com 3364560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com src[i, j] == sum[i+1, j+1] 3374560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com sum[0, j] == sum[i, 0] == 0 338fbfcd5602128ec010c82cb733c9cdc0a3254f9f3rmistry@google.com 3394560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com We assume that the sum buffer's stride == its width 3404560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com */ 34103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.comstatic void build_sum_buffer(uint32_t sum[], int srcW, int srcH, 34203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com const uint8_t src[], int srcRB) { 3434560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int sumW = srcW + 1; 3444560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com 3454560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com SkASSERT(srcRB >= srcW); 3468a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // mod srcRB so we can apply it after each row 3474560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com srcRB -= srcW; 3488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 3498a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int x, y; 3508a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 3514560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com // zero out the top row and column 3524560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com memset(sum, 0, sumW * sizeof(sum[0])); 3534560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com sum += sumW; 3544560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com 3558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // special case first row 3568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t X = 0; 3574560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com *sum++ = 0; // initialze the first column to 0 35803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com for (x = srcW - 1; x >= 0; --x) { 3598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com X = *src++ + X; 3604560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com *sum++ = X; 3618a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 3628a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += srcRB; 3638a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 3648a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // now do the rest of the rows 36503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com for (y = srcH - 1; y > 0; --y) { 3668a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t L = 0; 3678a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t C = 0; 3684560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com *sum++ = 0; // initialze the first column to 0 36901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 37001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (x = srcW - 1; !SkIsAlign4((intptr_t) src) && x >= 0; x--) { 37101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t T = sum[-sumW]; 37201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 37301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 37401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 37501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 37601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com } 37701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 37801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x >= 4; x-=4) { 37901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t T = sum[-sumW]; 38001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 38101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 38201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 38301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 38401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com T = sum[-sumW]; 38501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 38601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 38701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 38801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 38901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com T = sum[-sumW]; 39001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 39101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 39201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 39301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 39401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com T = sum[-sumW]; 39501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 39601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 39701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 39801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 39901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com } 40001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 40101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x >= 0; --x) { 4024560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com uint32_t T = sum[-sumW]; 4038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com X = *src++ + L + T - C; 4044560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com *sum++ = X; 4058a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com L = X; 4068a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com C = T; 4078a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 4088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += srcRB; 4098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 4108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 4118a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 41203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/** 4138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * This is the path for apply_kernel() to be taken when the kernel 4148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * is wider than the source image. 4158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com */ 4168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.comstatic void kernel_clamped(uint8_t dst[], int rx, int ry, const uint32_t sum[], 4178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int sw, int sh) { 4188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(2*rx > sw); 4198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4208caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t scale = (1 << 24) / ((2*rx + 1)*(2*ry + 1)); 4218caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4228caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int sumStride = sw + 1; 4238caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4248caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int dw = sw + 2*rx; 4258caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int dh = sh + 2*ry; 4268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int prev_y = -2*ry; 4288caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int next_y = 1; 4298caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4308caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int y = 0; y < dh; y++) { 4318caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int py = SkClampPos(prev_y) * sumStride; 4328caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ny = SkFastMin32(next_y, sh) * sumStride; 4338caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int prev_x = -2*rx; 4358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int next_x = 1; 4368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4378caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int x = 0; x < dw; x++) { 4388caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = SkClampPos(prev_x); 4398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = SkFastMin32(next_x, sw); 4408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny]; 4428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 4438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 4458caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 4468caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 4478caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4488caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_y += 1; 4498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_y += 1; 4508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 4518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com} 4528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com/** 45303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * sw and sh are the width and height of the src. Since the sum buffer 45403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * matches that, but has an extra row and col at the beginning (with zeros), 45503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * we can just use sw and sh as our "max" values for pinning coordinates 45603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * when sampling into sum[][] 4578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * 4588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * The inner loop is conceptually simple; we break it into several sections 4598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * to improve performance. Here's the original version: 4608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int x = 0; x < dw; x++) { 4618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = SkClampPos(prev_x); 4628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = SkFastMin32(next_x, sw); 4638caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny]; 4658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 4668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 4688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 4698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 47001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * The sections are: 47101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * left-hand section, where prev_x is clamped to 0 47201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * center section, where neither prev_x nor next_x is clamped 47301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * right-hand section, where next_x is clamped to sw 47401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * On some operating systems, the center section is unrolled for additional 47501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * speedup. 4768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com*/ 4774560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.comstatic void apply_kernel(uint8_t dst[], int rx, int ry, const uint32_t sum[], 4784560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int sw, int sh) { 4798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com if (2*rx > sw) { 4808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com kernel_clamped(dst, rx, ry, sum, sw, sh); 4818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com return; 4828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 4838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4848a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t scale = (1 << 24) / ((2*rx + 1)*(2*ry + 1)); 4858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 4864560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int sumStride = sw + 1; 4878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 4888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int dw = sw + 2*rx; 4898a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int dh = sh + 2*ry; 4908a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 4914560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int prev_y = -2*ry; 4924560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int next_y = 1; 4938a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 4948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(2*rx <= dw - 2*rx); 4958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 4964560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com for (int y = 0; y < dh; y++) { 4974560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int py = SkClampPos(prev_y) * sumStride; 4984560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int ny = SkFastMin32(next_y, sh) * sumStride; 4998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 5004560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int prev_x = -2*rx; 5014560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int next_x = 1; 5028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int x = 0; 5038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (; x < 2*rx; x++) { 5058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x <= 0); 5068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x <= sw); 5078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = 0; 5098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = next_x; 5108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny]; 5128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 5138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 5158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 5168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 5178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 51801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i0 = prev_x + py; 51901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i1 = next_x + ny; 52001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i2 = next_x + py; 52101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i3 = prev_x + ny; 52201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 52301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#if UNROLL_KERNEL_LOOP 52401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x < dw - 2*rx - 4; x += 4) { 5258caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x >= 0); 5268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x <= sw); 5278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 52801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 52901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 53001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 53101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 53201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 53301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 53401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 53501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 5368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 53701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com prev_x += 4; 53801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com next_x += 4; 53901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com } 54001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif 54101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 54201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x < dw - 2*rx; x++) { 54301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com SkASSERT(prev_x >= 0); 54401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com SkASSERT(next_x <= sw); 54501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 54601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 5478caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 5488caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 5508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 5518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 5528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5538caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (; x < dw; x++) { 5548caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x >= 0); 5558caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x > sw); 5568caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = prev_x; 5588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = sw; 5598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny]; 5618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 5628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5638caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 5648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 5658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 5668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_y += 1; 5688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_y += 1; 5698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 5708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com} 5718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com/** 5738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * This is the path for apply_kernel_interp() to be taken when the kernel 5748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * is wider than the source image. 5758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com */ 5768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.comstatic void kernel_interp_clamped(uint8_t dst[], int rx, int ry, 5778caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com const uint32_t sum[], int sw, int sh, U8CPU outer_weight) { 5788caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(2*rx > sw); 5798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inner_weight = 255 - outer_weight; 5818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com // round these guys up if they're bigger than 127 5838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com outer_weight += outer_weight >> 7; 5848caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com inner_weight += inner_weight >> 7; 5858caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5868caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_scale = (outer_weight << 16) / ((2*rx + 1)*(2*ry + 1)); 5878caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_scale = (inner_weight << 16) / ((2*rx - 1)*(2*ry - 1)); 5888caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5898caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int sumStride = sw + 1; 5908caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5918caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int dw = sw + 2*rx; 5928caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int dh = sh + 2*ry; 5938caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int prev_y = -2*ry; 5958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int next_y = 1; 5968caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5978caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int y = 0; y < dh; y++) { 5988caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int py = SkClampPos(prev_y) * sumStride; 5998caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ny = SkFastMin32(next_y, sh) * sumStride; 6008caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6018caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipy = SkClampPos(prev_y + 1) * sumStride; 6028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int iny = SkClampMax(next_y - 1, sh) * sumStride; 6038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int prev_x = -2*rx; 6058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int next_x = 1; 6068a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6074560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com for (int x = 0; x < dw; x++) { 6088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int px = SkClampPos(prev_x); 6098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int nx = SkFastMin32(next_x, sw); 6108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipx = SkClampPos(prev_x + 1); 6128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inx = SkClampMax(next_x - 1, sw); 6138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_sum = sum[px+py] + sum[nx+ny] 6158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[nx+py] - sum[px+ny]; 6168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny] 6178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[inx+ipy] - sum[ipx+iny]; 6188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 6198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 6208a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6218a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com prev_x += 1; 6228a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com next_x += 1; 6238a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 6248a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com prev_y += 1; 6258a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com next_y += 1; 6268a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 6278a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 6288a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 62903016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/** 63003016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * sw and sh are the width and height of the src. Since the sum buffer 63103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * matches that, but has an extra row and col at the beginning (with zeros), 63203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * we can just use sw and sh as our "max" values for pinning coordinates 63303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * when sampling into sum[][] 6348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * 6358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * The inner loop is conceptually simple; we break it into several variants 6368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * to improve performance. Here's the original version: 6378caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int x = 0; x < dw; x++) { 6388caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = SkClampPos(prev_x); 6398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = SkFastMin32(next_x, sw); 6408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipx = SkClampPos(prev_x + 1); 6428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inx = SkClampMax(next_x - 1, sw); 6438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_sum = sum[px+py] + sum[nx+ny] 6458caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[nx+py] - sum[px+ny]; 6468caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny] 6478caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[inx+ipy] - sum[ipx+iny]; 6488caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 6498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 6508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 6528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 6538caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 65401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * The sections are: 65501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * left-hand section, where prev_x is clamped to 0 65601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * center section, where neither prev_x nor next_x is clamped 65701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * right-hand section, where next_x is clamped to sw 65801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * On some operating systems, the center section is unrolled for additional 65901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * speedup. 6608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com*/ 6614560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.comstatic void apply_kernel_interp(uint8_t dst[], int rx, int ry, 6624560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com const uint32_t sum[], int sw, int sh, U8CPU outer_weight) { 6638a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkASSERT(rx > 0 && ry > 0); 6648a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkASSERT(outer_weight <= 255); 6658a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com if (2*rx > sw) { 6678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com kernel_interp_clamped(dst, rx, ry, sum, sw, sh, outer_weight); 6688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com return; 6698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 6708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6718a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int inner_weight = 255 - outer_weight; 6728a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6738a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // round these guys up if they're bigger than 127 6748a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com outer_weight += outer_weight >> 7; 6758a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com inner_weight += inner_weight >> 7; 6768a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6778a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t outer_scale = (outer_weight << 16) / ((2*rx + 1)*(2*ry + 1)); 6788a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t inner_scale = (inner_weight << 16) / ((2*rx - 1)*(2*ry - 1)); 6798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6804560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int sumStride = sw + 1; 6818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6828a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int dw = sw + 2*rx; 6838a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int dh = sh + 2*ry; 6848a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6854560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int prev_y = -2*ry; 6864560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int next_y = 1; 6878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6888caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(2*rx <= dw - 2*rx); 6898caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6904560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com for (int y = 0; y < dh; y++) { 6914560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int py = SkClampPos(prev_y) * sumStride; 6924560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int ny = SkFastMin32(next_y, sh) * sumStride; 6938a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6944560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int ipy = SkClampPos(prev_y + 1) * sumStride; 6954560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int iny = SkClampMax(next_y - 1, sh) * sumStride; 6968a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6974560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int prev_x = -2*rx; 6984560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int next_x = 1; 6998caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int x = 0; 7008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7018caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (; x < 2*rx; x++) { 7028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x < 0); 7038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x <= sw); 7048a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = 0; 7068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = next_x; 7078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipx = 0; 7098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inx = next_x - 1; 7108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_sum = sum[px+py] + sum[nx+ny] 7128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[nx+py] - sum[px+ny]; 7138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny] 7148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[inx+ipy] - sum[ipx+iny]; 7158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 7168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 7178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 7198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 7208caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 7218caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 72201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i0 = prev_x + py; 72301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i1 = next_x + ny; 72401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i2 = next_x + py; 72501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i3 = prev_x + ny; 72601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i4 = prev_x + 1 + ipy; 72701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i5 = next_x - 1 + iny; 72801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i6 = next_x - 1 + ipy; 72901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i7 = prev_x + 1 + iny; 73001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 73101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#if UNROLL_KERNEL_LOOP 73201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x < dw - 2*rx - 4; x += 4) { 7338caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x >= 0); 7348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x <= sw); 7358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 73601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 73701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 73801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 73901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com + inner_sum * inner_scale) >> 24); 74001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 74101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 74201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 74301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com + inner_sum * inner_scale) >> 24); 74401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 74501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 74601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 74701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com + inner_sum * inner_scale) >> 24); 74801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 74901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 75001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 75101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com + inner_sum * inner_scale) >> 24); 7528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 75301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com prev_x += 4; 75401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com next_x += 4; 75501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com } 75601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif 7578a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 75801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x < dw - 2*rx; x++) { 75901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com SkASSERT(prev_x >= 0); 76001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com SkASSERT(next_x <= sw); 76101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 76201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 76301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 7648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 7658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 7668a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7678a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com prev_x += 1; 7688a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com next_x += 1; 7698a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 7708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (; x < dw; x++) { 7728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x >= 0); 7738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x > sw); 7748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = prev_x; 7768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = sw; 7778caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7788caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipx = prev_x + 1; 7798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inx = sw; 7808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_sum = sum[px+py] + sum[nx+ny] 7828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[nx+py] - sum[px+ny]; 7838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny] 7848caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[inx+ipy] - sum[ipx+iny]; 7858caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 7868caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 7878caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7888caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 7898caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 7908caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 7918caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7928a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com prev_y += 1; 7938a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com next_y += 1; 7948a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 7958a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 7968a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7978a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkColorPriv.h" 7988a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7990e3c664250f561ec9f7107b92136517a72d03afdreed@android.comstatic void merge_src_with_blur(uint8_t dst[], int dstRB, 8000e3c664250f561ec9f7107b92136517a72d03afdreed@android.com const uint8_t src[], int srcRB, 8010e3c664250f561ec9f7107b92136517a72d03afdreed@android.com const uint8_t blur[], int blurRB, 8020e3c664250f561ec9f7107b92136517a72d03afdreed@android.com int sw, int sh) { 8030e3c664250f561ec9f7107b92136517a72d03afdreed@android.com dstRB -= sw; 8040e3c664250f561ec9f7107b92136517a72d03afdreed@android.com srcRB -= sw; 8050e3c664250f561ec9f7107b92136517a72d03afdreed@android.com blurRB -= sw; 8060e3c664250f561ec9f7107b92136517a72d03afdreed@android.com while (--sh >= 0) { 8070e3c664250f561ec9f7107b92136517a72d03afdreed@android.com for (int x = sw - 1; x >= 0; --x) { 8088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com *dst = SkToU8(SkAlphaMul(*blur, SkAlpha255To256(*src))); 8098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst += 1; 8108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += 1; 8118a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com blur += 1; 8128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 8130e3c664250f561ec9f7107b92136517a72d03afdreed@android.com dst += dstRB; 8140e3c664250f561ec9f7107b92136517a72d03afdreed@android.com src += srcRB; 8150e3c664250f561ec9f7107b92136517a72d03afdreed@android.com blur += blurRB; 8168a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 8178a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 8188a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8198a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.comstatic void clamp_with_orig(uint8_t dst[], int dstRowBytes, 8200e3c664250f561ec9f7107b92136517a72d03afdreed@android.com const uint8_t src[], int srcRowBytes, 8210e3c664250f561ec9f7107b92136517a72d03afdreed@android.com int sw, int sh, 8224560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com SkBlurMask::Style style) { 8238a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int x; 8240e3c664250f561ec9f7107b92136517a72d03afdreed@android.com while (--sh >= 0) { 8258a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com switch (style) { 8268a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com case SkBlurMask::kSolid_Style: 8270e3c664250f561ec9f7107b92136517a72d03afdreed@android.com for (x = sw - 1; x >= 0; --x) { 8280e3c664250f561ec9f7107b92136517a72d03afdreed@android.com int s = *src; 8290e3c664250f561ec9f7107b92136517a72d03afdreed@android.com int d = *dst; 8300e3c664250f561ec9f7107b92136517a72d03afdreed@android.com *dst = SkToU8(s + d - SkMulDiv255Round(s, d)); 8318a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst += 1; 8328a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += 1; 8338a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 8348a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com break; 8358a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com case SkBlurMask::kOuter_Style: 8360e3c664250f561ec9f7107b92136517a72d03afdreed@android.com for (x = sw - 1; x >= 0; --x) { 8370e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (*src) { 8388a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com *dst = SkToU8(SkAlphaMul(*dst, SkAlpha255To256(255 - *src))); 8390e3c664250f561ec9f7107b92136517a72d03afdreed@android.com } 8408a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst += 1; 8418a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += 1; 8428a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 8438a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com break; 8448a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com default: 8450c00f21fee3f5cfa3aa7e5d46ff94cb8cf340451tomhudson@google.com SkDEBUGFAIL("Unexpected blur style here"); 8468a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com break; 8478a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 8488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst += dstRowBytes - sw; 8490e3c664250f561ec9f7107b92136517a72d03afdreed@android.com src += srcRowBytes - sw; 8508a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 8518a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 8528a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 85303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/////////////////////////////////////////////////////////////////////////////// 8548a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com// we use a local funciton to wrap the class static method to work around 8568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com// a bug in gcc98 8578a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.comvoid SkMask_FreeImage(uint8_t* image); 85803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.comvoid SkMask_FreeImage(uint8_t* image) { 8598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkMask::FreeImage(image); 8608a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 8618a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8628a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.combool SkBlurMask::Blur(SkMask* dst, const SkMask& src, 8635af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com SkScalar radius, Style style, Quality quality, 86471f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkIPoint* margin, bool separable) 8655af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com{ 86603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com if (src.fFormat != SkMask::kA8_Format) { 8678a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com return false; 86803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com } 8698a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8704868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org // Force high quality off for small radii (performance) 87191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (radius < SkIntToScalar(3)) { 87291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org quality = kLow_Quality; 87391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } 8744868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org 8754868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org // highQuality: use three box blur passes as a cheap way to approximate a Gaussian blur 87691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org int passCount = (kHigh_Quality == quality) ? 3 : 1; 8777c7292c6071898d73dc935c3b66b9816183806f0humper@google.com SkScalar passRadius = (kHigh_Quality == quality) ? SkScalarMul( radius, kBlurRadiusFudgeFactor): radius; 8784868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org 8794868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int rx = SkScalarCeil(passRadius); 8804868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int outer_weight = 255 - SkScalarRound((SkIntToScalar(rx) - passRadius) * 255); 8818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8828a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkASSERT(rx >= 0); 8838a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkASSERT((unsigned)outer_weight <= 255); 8840e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (rx <= 0) { 8858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com return false; 8860e3c664250f561ec9f7107b92136517a72d03afdreed@android.com } 8878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int ry = rx; // only do square blur for now 8898a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8904868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int padx = passCount * rx; 8914868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int pady = passCount * ry; 8925af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com if (margin) { 8935af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com margin->set(padx, pady); 8945af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com } 8954868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org dst->fBounds.set(src.fBounds.fLeft - padx, src.fBounds.fTop - pady, 8964868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org src.fBounds.fRight + padx, src.fBounds.fBottom + pady); 89749f0ff25a046d6001dc2d095b6fa3c30f0f46b6areed@android.com dst->fRowBytes = dst->fBounds.width(); 8988a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst->fFormat = SkMask::kA8_Format; 8998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst->fImage = NULL; 9008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9010e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (src.fImage) { 902543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com size_t dstSize = dst->computeImageSize(); 903543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com if (0 == dstSize) { 904543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com return false; // too big to allocate, abort 905543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com } 906543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com 9078a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int sw = src.fBounds.width(); 9088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int sh = src.fBounds.height(); 9098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com const uint8_t* sp = src.fImage; 910543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com uint8_t* dp = SkMask::AllocImage(dstSize); 9118a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkAutoTCallVProc<uint8_t, SkMask_FreeImage> autoCall(dp); 9138a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9148a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // build the blurry destination 91571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org if (separable) { 91671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkAutoTMalloc<uint8_t> tmpBuffer(dstSize); 91771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org uint8_t* tp = tmpBuffer.get(); 91871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org int w = sw, h = sh; 91971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org 92091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (outer_weight == 255) { 921c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org int loRadius, hiRadius; 922c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org get_adjusted_radii(passRadius, &loRadius, &hiRadius); 92391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (kHigh_Quality == quality) { 92491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org // Do three X blurs, with a transpose on the final one. 92591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlur(sp, src.fRowBytes, tp, loRadius, hiRadius, w, h, false); 92691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlur(tp, w, dp, hiRadius, loRadius, w, h, false); 92791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlur(dp, w, tp, hiRadius, hiRadius, w, h, true); 92891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org // Do three Y blurs, with a transpose on the final one. 92991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlur(tp, h, dp, loRadius, hiRadius, h, w, false); 93091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlur(dp, h, tp, hiRadius, loRadius, h, w, false); 93191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlur(tp, h, dp, hiRadius, hiRadius, h, w, true); 93291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } else { 93391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlur(sp, src.fRowBytes, tp, rx, rx, w, h, true); 93491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlur(tp, h, dp, ry, ry, h, w, true); 93591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } 936908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org } else { 93791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (kHigh_Quality == quality) { 93891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org // Do three X blurs, with a transpose on the final one. 93991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlurInterp(sp, src.fRowBytes, tp, rx, w, h, false, outer_weight); 94091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlurInterp(tp, w, dp, rx, w, h, false, outer_weight); 94191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlurInterp(dp, w, tp, rx, w, h, true, outer_weight); 94291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org // Do three Y blurs, with a transpose on the final one. 94391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlurInterp(tp, h, dp, ry, h, w, false, outer_weight); 94491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlurInterp(dp, h, tp, ry, h, w, false, outer_weight); 94591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlurInterp(tp, h, dp, ry, h, w, true, outer_weight); 94691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } else { 94791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlurInterp(sp, src.fRowBytes, tp, rx, w, h, true, outer_weight); 94891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlurInterp(tp, h, dp, ry, h, w, true, outer_weight); 94991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } 95071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 95171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } else { 95203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com const size_t storageW = sw + 2 * (passCount - 1) * rx + 1; 95303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com const size_t storageH = sh + 2 * (passCount - 1) * ry + 1; 95403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com SkAutoTMalloc<uint32_t> storage(storageW * storageH); 9558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t* sumBuffer = storage.get(); 9568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9574868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org //pass1: sp is source, dp is destination 9588a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com build_sum_buffer(sumBuffer, sw, sh, sp, src.fRowBytes); 95903016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com if (outer_weight == 255) { 9608a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com apply_kernel(dp, rx, ry, sumBuffer, sw, sh); 96103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com } else { 9628a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com apply_kernel_interp(dp, rx, ry, sumBuffer, sw, sh, outer_weight); 96303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com } 9644868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org 96591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (kHigh_Quality == quality) { 9664868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org //pass2: dp is source, tmpBuffer is destination 9674868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int tmp_sw = sw + 2 * rx; 9684868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int tmp_sh = sh + 2 * ry; 9694868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org SkAutoTMalloc<uint8_t> tmpBuffer(dstSize); 9704868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org build_sum_buffer(sumBuffer, tmp_sw, tmp_sh, dp, tmp_sw); 9714868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org if (outer_weight == 255) 9724868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org apply_kernel(tmpBuffer.get(), rx, ry, sumBuffer, tmp_sw, tmp_sh); 9734868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org else 97403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com apply_kernel_interp(tmpBuffer.get(), rx, ry, sumBuffer, 97503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com tmp_sw, tmp_sh, outer_weight); 9764868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org 9774868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org //pass3: tmpBuffer is source, dp is destination 9784868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org tmp_sw += 2 * rx; 9794868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org tmp_sh += 2 * ry; 9804868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org build_sum_buffer(sumBuffer, tmp_sw, tmp_sh, tmpBuffer.get(), tmp_sw); 9814868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org if (outer_weight == 255) 9824868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org apply_kernel(dp, rx, ry, sumBuffer, tmp_sw, tmp_sh); 9834868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org else 98403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com apply_kernel_interp(dp, rx, ry, sumBuffer, tmp_sw, tmp_sh, 98503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com outer_weight); 9864868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org } 9878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 9888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9898a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst->fImage = dp; 9908a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // if need be, alloc the "real" dst (same size as src) and copy/merge 9918a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // the blur into it (applying the src) 9920e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (style == kInner_Style) { 9930e3c664250f561ec9f7107b92136517a72d03afdreed@android.com // now we allocate the "real" dst, mirror the size of src 994543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com size_t srcSize = src.computeImageSize(); 995543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com if (0 == srcSize) { 996543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com return false; // too big to allocate, abort 997543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com } 998543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com dst->fImage = SkMask::AllocImage(srcSize); 9990e3c664250f561ec9f7107b92136517a72d03afdreed@android.com merge_src_with_blur(dst->fImage, src.fRowBytes, 10000e3c664250f561ec9f7107b92136517a72d03afdreed@android.com sp, src.fRowBytes, 100103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com dp + passCount * (rx + ry * dst->fRowBytes), 100203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com dst->fRowBytes, sw, sh); 10038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkMask::FreeImage(dp); 10040e3c664250f561ec9f7107b92136517a72d03afdreed@android.com } else if (style != kNormal_Style) { 100503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com clamp_with_orig(dp + passCount * (rx + ry * dst->fRowBytes), 100603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com dst->fRowBytes, sp, src.fRowBytes, sw, sh, style); 10078a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 10088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com (void)autoCall.detach(); 10098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 10108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 10110e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (style == kInner_Style) { 10128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst->fBounds = src.fBounds; // restore trimmed bounds 10130e3c664250f561ec9f7107b92136517a72d03afdreed@android.com dst->fRowBytes = src.fRowBytes; 10148a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 10158a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 10168a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com return true; 10178a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 10188a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 101971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.orgbool SkBlurMask::BlurSeparable(SkMask* dst, const SkMask& src, 102071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkScalar radius, Style style, Quality quality, 102171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkIPoint* margin) 102271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{ 102371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org return SkBlurMask::Blur(dst, src, radius, style, quality, margin, true); 102471f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org} 102571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org 102671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.orgbool SkBlurMask::Blur(SkMask* dst, const SkMask& src, 102771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkScalar radius, Style style, Quality quality, 102871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkIPoint* margin) 102971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{ 103071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org return SkBlurMask::Blur(dst, src, radius, style, quality, margin, false); 103171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org} 10327c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10337c7292c6071898d73dc935c3b66b9816183806f0humper@google.com/* Convolving a box with itself three times results in a piecewise 10347c7292c6071898d73dc935c3b66b9816183806f0humper@google.com quadratic function: 10358ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 10367c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 0 x <= -1.5 10377c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 9/8 + 3/2 x + 1/2 x^2 -1.5 < x <= 1.5 10387c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 3/4 - x^2 -.5 < x <= .5 10397c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 9/8 - 3/2 x + 1/2 x^2 0.5 < x <= 1.5 10407c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 0 1.5 < x 10418ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 10427c7292c6071898d73dc935c3b66b9816183806f0humper@google.com To get the profile curve of the blurred step function at the rectangle 10437c7292c6071898d73dc935c3b66b9816183806f0humper@google.com edge, we evaluate the indefinite integral, which is piecewise cubic: 10448ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 10457c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 0 x <= -1.5 10467c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 5/8 + 9/8 x + 3/4 x^2 + 1/6 x^3 -1.5 < x <= -0.5 10477c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 1/2 + 3/4 x - 1/3 x^3 -.5 < x <= .5 10487c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 3/8 + 9/8 x - 3/4 x^2 + 1/6 x^3 .5 < x <= 1.5 10497c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 1 1.5 < x 10507c7292c6071898d73dc935c3b66b9816183806f0humper@google.com*/ 10517c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10527c7292c6071898d73dc935c3b66b9816183806f0humper@google.comstatic float gaussian_integral( float x ) { 10537c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if ( x > 1.5f ) { 10547c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return 0.0f; 10557c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 10567c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if ( x < -1.5f ) { 10577c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return 1.0f; 10587c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 10597c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10607c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float x2 = x*x; 10617c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float x3 = x2*x; 10627c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10639c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com if ( x > 0.5f ) { 10649c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com return 0.5625f - ( x3 / 6.0f - 3.0f * x2 * 0.25f + 1.125f * x); 10657c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 10669c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com if ( x > -0.5f ) { 10679c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com return 0.5f - (0.75f * x - x3 / 3.0f); 10687c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 10699c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com return 0.4375f + (-x3 / 6.0f - 3.0f * x2 * 0.25f - 1.125f * x); 10707c7292c6071898d73dc935c3b66b9816183806f0humper@google.com} 10717c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10728ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com/* 10737c7292c6071898d73dc935c3b66b9816183806f0humper@google.com compute_profile allocates and fills in an array of floating 10748ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com point values between 0 and 255 for the profile signature of 10757c7292c6071898d73dc935c3b66b9816183806f0humper@google.com a blurred half-plane with the given blur radius. Since we're 10767c7292c6071898d73dc935c3b66b9816183806f0humper@google.com going to be doing screened multiplications (i.e., 1 - (1-x)(1-y)) 10777c7292c6071898d73dc935c3b66b9816183806f0humper@google.com all the time, we actually fill in the profile pre-inverted 10787c7292c6071898d73dc935c3b66b9816183806f0humper@google.com (already done 255-x). 10798ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 10807c7292c6071898d73dc935c3b66b9816183806f0humper@google.com The function returns the size of the array allocated for the 10818ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com profile. It's the responsibility of the caller to delete the 10827c7292c6071898d73dc935c3b66b9816183806f0humper@google.com memory returned in profile_out. 10837c7292c6071898d73dc935c3b66b9816183806f0humper@google.com*/ 10847c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10857c7292c6071898d73dc935c3b66b9816183806f0humper@google.comstatic int compute_profile( SkScalar radius, unsigned int **profile_out ) { 10869c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com int size = SkScalarFloorToInt(radius * 3 + 1); 10877c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int center = size >> 1; 10887c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10897c7292c6071898d73dc935c3b66b9816183806f0humper@google.com unsigned int *profile = new unsigned int [size]; 10907c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10917c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float invr = 1.0f/radius; 10927c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 10937c7292c6071898d73dc935c3b66b9816183806f0humper@google.com profile[0] = 255; 10947c7292c6071898d73dc935c3b66b9816183806f0humper@google.com for (int x = 1 ; x < size ; x++) { 10957c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float scaled_x = ( center - x ) * invr; 10967c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float gi = gaussian_integral( scaled_x ); 10977c7292c6071898d73dc935c3b66b9816183806f0humper@google.com profile[x] = 255 - (uint8_t) ( 255.f * gi ); 10987c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 10997c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11007c7292c6071898d73dc935c3b66b9816183806f0humper@google.com *profile_out = profile; 11017c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return size; 11027c7292c6071898d73dc935c3b66b9816183806f0humper@google.com} 11037c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11048ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// TODO MAYBE: Maintain a profile cache to avoid recomputing this for 11057c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// commonly used radii. Consider baking some of the most common blur radii 11067c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// directly in as static data? 11077c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11087c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// Implementation adapted from Michael Herf's approach: 11097c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// http://stereopsis.com/shadowrect/ 11107c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11117c7292c6071898d73dc935c3b66b9816183806f0humper@google.combool SkBlurMask::BlurRect(SkMask *dst, const SkRect &src, 11127c7292c6071898d73dc935c3b66b9816183806f0humper@google.com SkScalar provided_radius, Style style, Quality quality, 11137c7292c6071898d73dc935c3b66b9816183806f0humper@google.com SkIPoint *margin) { 11147c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int profile_size; 11157c7292c6071898d73dc935c3b66b9816183806f0humper@google.com unsigned int *profile; 11168ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11178ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11187c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float radius = SkScalarToFloat( SkScalarMul( provided_radius, kBlurRadiusFudgeFactor ) ); 11198ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11207c7292c6071898d73dc935c3b66b9816183806f0humper@google.com profile_size = compute_profile( radius, &profile ); 11218ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11227c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int pad = (int) (radius * 1.5f + 1); 11237c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if (margin) { 11247c7292c6071898d73dc935c3b66b9816183806f0humper@google.com margin->set( pad, pad ); 11257c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11269c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com dst->fBounds = SkIRect::MakeWH(SkScalarFloorToInt(src.width()), SkScalarFloorToInt(src.height())); 11277c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fBounds.outset(pad, pad); 11288ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11297c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fRowBytes = dst->fBounds.width(); 11307c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fFormat = SkMask::kA8_Format; 11317c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fImage = NULL; 11328ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11337c7292c6071898d73dc935c3b66b9816183806f0humper@google.com size_t dstSize = dst->computeImageSize(); 11347c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if (0 == dstSize) { 11357c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return false; // too big to allocate, abort 11367c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11378ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11389c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com int sw = SkScalarFloorToInt(src.width()); 11399c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com int sh = SkScalarFloorToInt(src.height()); 11408ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11417c7292c6071898d73dc935c3b66b9816183806f0humper@google.com uint8_t* dp = SkMask::AllocImage(dstSize); 11428ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11437c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fImage = dp; 11448ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11457c7292c6071898d73dc935c3b66b9816183806f0humper@google.com SkAutoTCallVProc<uint8_t, SkMask_FreeImage> autoCall(dp); 11468ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11477c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int dst_height = dst->fBounds.height(); 11487c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int dst_width = dst->fBounds.width(); 11498ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11507c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // nearest odd number less than the profile size represents the center 11517c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // of the (2x scaled) profile 11527c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int center = ( profile_size & ~1 ) - 1; 11538ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11547c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int w = sw - center; 11557c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int h = sh - center; 11568ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11577c7292c6071898d73dc935c3b66b9816183806f0humper@google.com uint8_t *outptr = dp; 11588ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11597c7292c6071898d73dc935c3b66b9816183806f0humper@google.com for (int y = 0 ; y < dst_height ; y++) 11607c7292c6071898d73dc935c3b66b9816183806f0humper@google.com { 11617c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // time to fill in a scanline of the blurry rectangle. 11627c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // to avoid floating point math, everything is multiplied by 11637c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // 2 where needed. This keeps things nice and integer-oriented. 11648ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11657c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int dy = abs((y << 1) - dst_height) - h; // how far are we from the original edge? 11667c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int oy = dy >> 1; 11677c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if (oy < 0) oy = 0; 11688ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11697c7292c6071898d73dc935c3b66b9816183806f0humper@google.com unsigned int profile_y = profile[oy]; 11708ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11717c7292c6071898d73dc935c3b66b9816183806f0humper@google.com for (int x = 0 ; x < (dst_width << 1) ; x += 2) { 11727c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int dx = abs( x - dst_width ) - w; 11737c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int ox = dx >> 1; 11747c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if (ox < 0) ox = 0; 11758ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11767c7292c6071898d73dc935c3b66b9816183806f0humper@google.com unsigned int maskval = SkMulDiv255Round(profile[ox], profile_y); 11778ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11787c7292c6071898d73dc935c3b66b9816183806f0humper@google.com *(outptr++) = maskval; 11797c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11807c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11818ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11827c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return true; 11837c7292c6071898d73dc935c3b66b9816183806f0humper@google.com} 1184