SkBlurMask.cpp revision 76bf70d38fd109a09ee44d074cfd392e1884afff
1ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com 2ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com/* 3ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * Copyright 2006 The Android Open Source Project 4ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * 5ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * Use of this source code is governed by a BSD-style license that can be 6ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com * found in the LICENSE file. 7ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com */ 8ec3ed6a5ebf6f2c406d7bcf94b6bc34fcaeb976eepoger@google.com 98a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkBlurMask.h" 11889bd8bd7f604acae0a6303365bc82c06da1e6f3tomhudson@google.com#include "SkMath.h" 128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkTemplates.h" 1301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#include "SkEndian.h" 1401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 158ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// scale factor for the blur radius to match the behavior of the all existing blur 167c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// code (both on the CPU and the GPU). This magic constant is 1/sqrt(3). 177c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 188ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// TODO: get rid of this fudge factor and move any required fudging up into 197c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// the calling library 207c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 217c7292c6071898d73dc935c3b66b9816183806f0humper@google.com#define kBlurRadiusFudgeFactor SkFloatToScalar( .57735f ) 227c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define UNROLL_SEPARABLE_LOOPS 249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 25908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org/** 26908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * This function performs a box blur in X, of the given radius. If the 27884e60be30e20f38b3466a4697081187d2f1f814skia.committer@gmail.com * "transpose" parameter is true, it will transpose the pixels on write, 28908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * such that X and Y are swapped. Reads are always performed from contiguous 29908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org * memory in X, for speed. The destination buffer (dst) must be at least 309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * (width + leftRadius + rightRadius) * height bytes in size. 314a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * 324a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * This is what the inner loop looks like before unrolling, and with the two 334a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * cases broken out separately (width < diameter, width >= diameter): 3476bf70d38fd109a09ee44d074cfd392e1884afffskia.committer@gmail.com * 354a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * if (width < diameter) { 364a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = 0; x < width; ++x) { 374a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * sum += *right++; 3876bf70d38fd109a09ee44d074cfd392e1884afffskia.committer@gmail.com * *dptr = (sum * scale + half) >> 24; 394a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 404a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 414a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = width; x < diameter; ++x) { 424a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (sum * scale + half) >> 24; 434a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 444a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 454a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = 0; x < width; ++x) { 464a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (sum * scale + half) >> 24; 474a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * sum -= *left++; 484a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 494a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 504a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } else { 514a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = 0; x < diameter; ++x) { 524a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * sum += *right++; 534a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (sum * scale + half) >> 24; 544a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 554a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 564a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = diameter; x < width; ++x) { 574a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * sum += *right++; 584a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (sum * scale + half) >> 24; 594a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * sum -= *left++; 604a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 614a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 624a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = 0; x < diameter; ++x) { 634a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (sum * scale + half) >> 24; 644a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * sum -= *left++; 654a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 664a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 674a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 68908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org */ 69908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.orgstatic int boxBlur(const uint8_t* src, int src_y_stride, uint8_t* dst, 70c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org int leftRadius, int rightRadius, int width, int height, 71c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org bool transpose) 7271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{ 739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int diameter = leftRadius + rightRadius; 749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int kernelSize = diameter + 1; 759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int border = SkMin32(width, diameter); 7671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org uint32_t scale = (1 << 24) / kernelSize; 77c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org int new_width = width + SkMax32(leftRadius, rightRadius) * 2; 78908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org int dst_x_stride = transpose ? height : 1; 79908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org int dst_y_stride = transpose ? 1 : new_width; 804a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#ifndef SK_DISABLE_BLUR_ROUNDING 814a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org uint32_t half = 1 << 23; 824a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#else 834a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org uint32_t half = 0; 844a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#endif 8571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org for (int y = 0; y < height; ++y) { 864a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org uint32_t sum = 0; 87908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org uint8_t* dptr = dst + y * dst_y_stride; 88908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org const uint8_t* right = src + y * src_y_stride; 89908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org const uint8_t* left = right; 90336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org for (int x = 0; x < rightRadius - leftRadius; x++) { 91336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org *dptr = 0; 92336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org dptr += dst_x_stride; 93c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org } 949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define LEFT_BORDER_ITER \ 959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org sum += *right++; \ 964a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *dptr = (sum * scale + half) >> 24; \ 97908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org dptr += dst_x_stride; 989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int x = 0; 1009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 1019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border - 16; x += 16) { 1029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1149b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1159b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1169b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1179b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 11871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 1199b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 1209b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border; ++x) { 1219b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 1229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 1239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef LEFT_BORDER_ITER 1249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define TRIVIAL_ITER \ 1254a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *dptr = (sum * scale + half) >> 24; \ 126908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org dptr += dst_x_stride; 1279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = width; 1289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 1299b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < diameter - 16; x += 16) { 1309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1319b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1329b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1339b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1349b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1359b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1399b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1409b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1419b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1429b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1439b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1449b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1459b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 1469b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 1479b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 1489b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < diameter; ++x) { 1499b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org TRIVIAL_ITER 15071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 1519b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef TRIVIAL_ITER 1529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define CENTER_ITER \ 1539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org sum += *right++; \ 1544a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *dptr = (sum * scale + half) >> 24; \ 1559b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org sum -= *left++; \ 156908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org dptr += dst_x_stride; 1579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 1589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = diameter; 1599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 1609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < width - 16; x += 16) { 1619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1699b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1719b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1729b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1769b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 1779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 1789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 1799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < width; ++x) { 1809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 18171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 1829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef CENTER_ITER 1839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define RIGHT_BORDER_ITER \ 1844a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *dptr = (sum * scale + half) >> 24; \ 1859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org sum -= *left++; \ 186908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org dptr += dst_x_stride; 1879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 1889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = 0; 1899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 1909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border - 16; x += 16) { 1919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 1999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 2079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 2089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 2099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border; ++x) { 2109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 21171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 2129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef RIGHT_BORDER_ITER 213336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org for (int x = 0; x < leftRadius - rightRadius; x++) { 214336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org *dptr = 0; 215336b4da6b0d20f27f9980b03415354a2f0698e18senorblanco@chromium.org dptr += dst_x_stride; 216c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org } 21771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkASSERT(sum == 0); 21871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 219908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org return new_width; 22071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org} 22171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org 2229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org/** 2239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * This variant of the box blur handles blurring of non-integer radii. It 2249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * keeps two running sums: an outer sum for the rounded-up kernel radius, and 2259b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * an inner sum for the rounded-down kernel radius. For each pixel, it linearly 2269b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * interpolates between them. In float this would be: 2279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * outer_weight * outer_sum / kernelSize + 2289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org * (1.0 - outer_weight) * innerSum / (kernelSize - 2) 22976bf70d38fd109a09ee44d074cfd392e1884afffskia.committer@gmail.com * 2304a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * This is what the inner loop looks like before unrolling, and with the two 2314a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * cases broken out separately (width < diameter, width >= diameter): 23276bf70d38fd109a09ee44d074cfd392e1884afffskia.committer@gmail.com * 2334a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * if (width < diameter) { 2344a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = 0; x < width; x++) { 2354a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * inner_sum = outer_sum; 2364a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * outer_sum += *right++; 2374a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; 2384a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 2394a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 2404a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = width; x < diameter; ++x) { 2414a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; 2424a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 2434a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 2444a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = 0; x < width; x++) { 2454a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * inner_sum = outer_sum - *left++; 2464a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; 2474a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 2484a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * outer_sum = inner_sum; 2494a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 2504a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } else { 2514a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = 0; x < diameter; x++) { 2524a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * inner_sum = outer_sum; 2534a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * outer_sum += *right++; 2544a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; 2554a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 2564a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 2574a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = diameter; x < width; ++x) { 2584a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * inner_sum = outer_sum - *left; 2594a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * outer_sum += *right++; 2604a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; 2614a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 2624a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * outer_sum -= *left++; 2634a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 2644a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * for (int x = 0; x < diameter; x++) { 2654a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * inner_sum = outer_sum - *left++; 2664a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; 2674a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * dptr += dst_x_stride; 2684a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * outer_sum = inner_sum; 2694a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 2704a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 2714a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * } 2724a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org * return new_width; 2739b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org */ 2744a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org 2759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.orgstatic int boxBlurInterp(const uint8_t* src, int src_y_stride, uint8_t* dst, 2769b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int radius, int width, int height, 2779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org bool transpose, uint8_t outer_weight) 2789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org{ 2799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int diameter = radius * 2; 2809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int kernelSize = diameter + 1; 2819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int border = SkMin32(width, diameter); 2829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int inner_weight = 255 - outer_weight; 2839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_weight += outer_weight >> 7; 2849b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org inner_weight += inner_weight >> 7; 2859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org uint32_t outer_scale = (outer_weight << 16) / kernelSize; 2869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org uint32_t inner_scale = (inner_weight << 16) / (kernelSize - 2); 2874a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#ifndef SK_DISABLE_BLUR_ROUNDING 2884a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org uint32_t half = 1 << 23; 2894a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#else 2904a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org uint32_t half = 0; 2914a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org#endif 2929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int new_width = width + diameter; 2939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int dst_x_stride = transpose ? height : 1; 2949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int dst_y_stride = transpose ? 1 : new_width; 2959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (int y = 0; y < height; ++y) { 2964a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org uint32_t outer_sum = 0, inner_sum = 0; 2979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org uint8_t* dptr = dst + y * dst_y_stride; 2989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org const uint8_t* right = src + y * src_y_stride; 2999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org const uint8_t* left = right; 3009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org int x = 0; 3019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 3029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define LEFT_BORDER_ITER \ 3039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org inner_sum = outer_sum; \ 3049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_sum += *right++; \ 3054a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; \ 3069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org dptr += dst_x_stride; 3079b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 3089b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 3099b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (;x < border - 16; x += 16) { 3109b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3119b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3129b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3139b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3149b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3159b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3169b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3179b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3189b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3199b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3209b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3219b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3229b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3239b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3249b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3259b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3269b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3279b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 3289b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 3299b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (;x < border; x++) { 3309b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org LEFT_BORDER_ITER 3319b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3329b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef LEFT_BORDER_ITER 3339b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (int x = width; x < diameter; ++x) { 3344a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; 3359b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org dptr += dst_x_stride; 3369b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3379b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = diameter; 3389b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 3399b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#define CENTER_ITER \ 3409b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org inner_sum = outer_sum - *left; \ 3419b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_sum += *right++; \ 3424a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; \ 3439b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org dptr += dst_x_stride; \ 3449b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_sum -= *left++; 3459b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 3469b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 3479b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < width - 16; x += 16) { 3489b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3499b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3509b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3519b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3529b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3539b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3549b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3559b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3569b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3579b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3589b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3599b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3609b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3619b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3629b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3639b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3649b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3659b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 3669b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < width; ++x) { 3679b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org CENTER_ITER 3689b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3699b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef CENTER_ITER 3709b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 3719b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org #define RIGHT_BORDER_ITER \ 3729b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org inner_sum = outer_sum - *left++; \ 3734a525d7fc2cc0d8029bc66095730ddba3df3cb9esenorblanco@chromium.org *dptr = (outer_sum * outer_scale + inner_sum * inner_scale + half) >> 24; \ 3749b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org dptr += dst_x_stride; \ 3759b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org outer_sum = inner_sum; 3769b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 3779b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org x = 0; 3789b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#ifdef UNROLL_SEPARABLE_LOOPS 3799b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border - 16; x += 16) { 3809b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3819b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3829b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3839b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3849b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3859b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3869b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3879b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3889b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3899b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3909b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3919b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3929b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3939b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3949b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3959b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 3969b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 3979b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#endif 3989b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org for (; x < border; x++) { 3999b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org RIGHT_BORDER_ITER 4009b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 4019b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org#undef RIGHT_BORDER_ITER 4029b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org SkASSERT(outer_sum == 0 && inner_sum == 0); 4039b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org } 4049b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org return new_width; 4059b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org} 4069b0d4d79f023ce91b53d9eaa47508b6722c246e6senorblanco@chromium.org 407c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.orgstatic void get_adjusted_radii(SkScalar passRadius, int *loRadius, int *hiRadius) 408c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org{ 409c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org *loRadius = *hiRadius = SkScalarCeil(passRadius); 410c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org if (SkIntToScalar(*hiRadius) - passRadius > SkFloatToScalar(0.5f)) { 411c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org *loRadius = *hiRadius - 1; 412c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org } 413c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org} 414c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org 41501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com// Unrolling the integer blur kernel seems to give us a ~15% speedup on Windows, 41601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com// breakeven on Mac, and ~15% slowdown on Linux. 41701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com// Reading a word at a time when bulding the sum buffer seems to give 41801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com// us no appreciable speedup on Windows or Mac, and 2% slowdown on Linux. 419054ff1efa4f9187ce7fd20aaf3aed7cecf14e12btomhudson@google.com#if defined(SK_BUILD_FOR_WIN32) 42001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#define UNROLL_KERNEL_LOOP 1 42101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif 4228a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 4234560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com/** The sum buffer is an array of u32 to hold the accumulated sum of all of the 4244560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com src values at their position, plus all values above and to the left. 4254560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com When we sample into this buffer, we need an initial row and column of 0s, 4264560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com so we have an index correspondence as follows: 427fbfcd5602128ec010c82cb733c9cdc0a3254f9f3rmistry@google.com 4284560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com src[i, j] == sum[i+1, j+1] 4294560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com sum[0, j] == sum[i, 0] == 0 430fbfcd5602128ec010c82cb733c9cdc0a3254f9f3rmistry@google.com 4314560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com We assume that the sum buffer's stride == its width 4324560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com */ 43303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.comstatic void build_sum_buffer(uint32_t sum[], int srcW, int srcH, 43403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com const uint8_t src[], int srcRB) { 4354560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int sumW = srcW + 1; 4364560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com 4374560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com SkASSERT(srcRB >= srcW); 4388a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // mod srcRB so we can apply it after each row 4394560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com srcRB -= srcW; 4408a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 4418a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int x, y; 4428a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 4434560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com // zero out the top row and column 4444560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com memset(sum, 0, sumW * sizeof(sum[0])); 4454560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com sum += sumW; 4464560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com 4478a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // special case first row 4488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t X = 0; 4494560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com *sum++ = 0; // initialze the first column to 0 45003016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com for (x = srcW - 1; x >= 0; --x) { 4518a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com X = *src++ + X; 4524560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com *sum++ = X; 4538a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 4548a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += srcRB; 4558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 4568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // now do the rest of the rows 45703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com for (y = srcH - 1; y > 0; --y) { 4588a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t L = 0; 4598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t C = 0; 4604560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com *sum++ = 0; // initialze the first column to 0 46101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 46201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (x = srcW - 1; !SkIsAlign4((intptr_t) src) && x >= 0; x--) { 46301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t T = sum[-sumW]; 46401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 46501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 46601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 46701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 46801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com } 46901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 47001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x >= 4; x-=4) { 47101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t T = sum[-sumW]; 47201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 47301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 47401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 47501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 47601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com T = sum[-sumW]; 47701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 47801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 47901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 48001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 48101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com T = sum[-sumW]; 48201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 48301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 48401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 48501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 48601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com T = sum[-sumW]; 48701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com X = *src++ + L + T - C; 48801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *sum++ = X; 48901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com L = X; 49001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com C = T; 49101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com } 49201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 49301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x >= 0; --x) { 4944560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com uint32_t T = sum[-sumW]; 4958a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com X = *src++ + L + T - C; 4964560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com *sum++ = X; 4978a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com L = X; 4988a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com C = T; 4998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 5008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += srcRB; 5018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 5028a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 5038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 50403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/** 5058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * This is the path for apply_kernel() to be taken when the kernel 5068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * is wider than the source image. 5078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com */ 5088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.comstatic void kernel_clamped(uint8_t dst[], int rx, int ry, const uint32_t sum[], 5098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int sw, int sh) { 5108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(2*rx > sw); 5118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t scale = (1 << 24) / ((2*rx + 1)*(2*ry + 1)); 5138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5148caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int sumStride = sw + 1; 5158caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5168caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int dw = sw + 2*rx; 5178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int dh = sh + 2*ry; 5188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int prev_y = -2*ry; 5208caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int next_y = 1; 5218caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5228caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int y = 0; y < dh; y++) { 5238caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int py = SkClampPos(prev_y) * sumStride; 5248caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ny = SkFastMin32(next_y, sh) * sumStride; 5258caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int prev_x = -2*rx; 5278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int next_x = 1; 5288caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5298caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int x = 0; x < dw; x++) { 5308caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = SkClampPos(prev_x); 5318caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = SkFastMin32(next_x, sw); 5328caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5338caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny]; 5348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 5358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 5378caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 5388caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 5398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_y += 1; 5418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_y += 1; 5428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 5438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com} 5448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com/** 54503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * sw and sh are the width and height of the src. Since the sum buffer 54603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * matches that, but has an extra row and col at the beginning (with zeros), 54703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * we can just use sw and sh as our "max" values for pinning coordinates 54803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * when sampling into sum[][] 5498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * 5508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * The inner loop is conceptually simple; we break it into several sections 5518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * to improve performance. Here's the original version: 5528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int x = 0; x < dw; x++) { 5538caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = SkClampPos(prev_x); 5548caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = SkFastMin32(next_x, sw); 5558caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5568caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny]; 5578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 5588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 5608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 5618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 56201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * The sections are: 56301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * left-hand section, where prev_x is clamped to 0 56401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * center section, where neither prev_x nor next_x is clamped 56501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * right-hand section, where next_x is clamped to sw 56601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * On some operating systems, the center section is unrolled for additional 56701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * speedup. 5688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com*/ 5694560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.comstatic void apply_kernel(uint8_t dst[], int rx, int ry, const uint32_t sum[], 5704560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int sw, int sh) { 5718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com if (2*rx > sw) { 5728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com kernel_clamped(dst, rx, ry, sum, sw, sh); 5738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com return; 5748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 5758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5768a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t scale = (1 << 24) / ((2*rx + 1)*(2*ry + 1)); 5778a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 5784560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int sumStride = sw + 1; 5798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 5808a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int dw = sw + 2*rx; 5818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int dh = sh + 2*ry; 5828a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 5834560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int prev_y = -2*ry; 5844560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int next_y = 1; 5858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 5868caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(2*rx <= dw - 2*rx); 5878caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5884560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com for (int y = 0; y < dh; y++) { 5894560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int py = SkClampPos(prev_y) * sumStride; 5904560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int ny = SkFastMin32(next_y, sh) * sumStride; 5918a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 5924560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int prev_x = -2*rx; 5934560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int next_x = 1; 5948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int x = 0; 5958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 5968caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (; x < 2*rx; x++) { 5978caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x <= 0); 5988caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x <= sw); 5998caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6008caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = 0; 6018caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = next_x; 6028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny]; 6048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 6058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 6078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 6088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 6098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 61001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i0 = prev_x + py; 61101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i1 = next_x + ny; 61201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i2 = next_x + py; 61301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i3 = prev_x + ny; 61401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 61501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#if UNROLL_KERNEL_LOOP 61601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x < dw - 2*rx - 4; x += 4) { 6178caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x >= 0); 6188caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x <= sw); 6198caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 62001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 62101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 62201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 62301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 62401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 62501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 62601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 62701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 6288caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 62901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com prev_x += 4; 63001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com next_x += 4; 63101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com } 63201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif 63301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 63401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x < dw - 2*rx; x++) { 63501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com SkASSERT(prev_x >= 0); 63601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com SkASSERT(next_x <= sw); 63701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 63801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t tmp = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 6398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 6408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 6428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 6438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 6448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6458caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (; x < dw; x++) { 6468caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x >= 0); 6478caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x > sw); 6488caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6498caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = prev_x; 6508caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = sw; 6518caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t tmp = sum[px+py] + sum[nx+ny] - sum[nx+py] - sum[px+ny]; 6538caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8(tmp * scale >> 24); 6548caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6558caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 6568caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 6578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 6588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_y += 1; 6608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_y += 1; 6618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 6628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com} 6638caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com/** 6658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * This is the path for apply_kernel_interp() to be taken when the kernel 6668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * is wider than the source image. 6678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com */ 6688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.comstatic void kernel_interp_clamped(uint8_t dst[], int rx, int ry, 6698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com const uint32_t sum[], int sw, int sh, U8CPU outer_weight) { 6708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(2*rx > sw); 6718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inner_weight = 255 - outer_weight; 6738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com // round these guys up if they're bigger than 127 6758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com outer_weight += outer_weight >> 7; 6768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com inner_weight += inner_weight >> 7; 6778caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6788caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_scale = (outer_weight << 16) / ((2*rx + 1)*(2*ry + 1)); 6798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_scale = (inner_weight << 16) / ((2*rx - 1)*(2*ry - 1)); 6808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int sumStride = sw + 1; 6828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int dw = sw + 2*rx; 6848caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int dh = sh + 2*ry; 6858caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6868caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int prev_y = -2*ry; 6878caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int next_y = 1; 6888caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6898caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int y = 0; y < dh; y++) { 6908caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int py = SkClampPos(prev_y) * sumStride; 6918caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ny = SkFastMin32(next_y, sh) * sumStride; 6928caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6938caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipy = SkClampPos(prev_y + 1) * sumStride; 6948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int iny = SkClampMax(next_y - 1, sh) * sumStride; 6958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 6968caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int prev_x = -2*rx; 6978caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int next_x = 1; 6988a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 6994560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com for (int x = 0; x < dw; x++) { 7008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int px = SkClampPos(prev_x); 7018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int nx = SkFastMin32(next_x, sw); 7028a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipx = SkClampPos(prev_x + 1); 7048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inx = SkClampMax(next_x - 1, sw); 7058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_sum = sum[px+py] + sum[nx+ny] 7078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[nx+py] - sum[px+ny]; 7088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny] 7098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[inx+ipy] - sum[ipx+iny]; 7108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 7118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 7128a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7138a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com prev_x += 1; 7148a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com next_x += 1; 7158a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 7168a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com prev_y += 1; 7178a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com next_y += 1; 7188a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 7198a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 7208a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 72103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/** 72203016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * sw and sh are the width and height of the src. Since the sum buffer 72303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * matches that, but has an extra row and col at the beginning (with zeros), 72403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * we can just use sw and sh as our "max" values for pinning coordinates 72503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com * when sampling into sum[][] 7268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * 7278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * The inner loop is conceptually simple; we break it into several variants 7288caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com * to improve performance. Here's the original version: 7298caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (int x = 0; x < dw; x++) { 7308caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = SkClampPos(prev_x); 7318caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = SkFastMin32(next_x, sw); 7328caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7338caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipx = SkClampPos(prev_x + 1); 7348caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inx = SkClampMax(next_x - 1, sw); 7358caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7368caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_sum = sum[px+py] + sum[nx+ny] 7378caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[nx+py] - sum[px+ny]; 7388caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny] 7398caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[inx+ipy] - sum[ipx+iny]; 7408caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 7418caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 7428caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7438caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 7448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 7458caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 74601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * The sections are: 74701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * left-hand section, where prev_x is clamped to 0 74801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * center section, where neither prev_x nor next_x is clamped 74901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * right-hand section, where next_x is clamped to sw 75001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * On some operating systems, the center section is unrolled for additional 75101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com * speedup. 7528caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com*/ 7534560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.comstatic void apply_kernel_interp(uint8_t dst[], int rx, int ry, 7544560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com const uint32_t sum[], int sw, int sh, U8CPU outer_weight) { 7558a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkASSERT(rx > 0 && ry > 0); 7568a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkASSERT(outer_weight <= 255); 7578a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7588caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com if (2*rx > sw) { 7598caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com kernel_interp_clamped(dst, rx, ry, sum, sw, sh, outer_weight); 7608caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com return; 7618caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 7628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7638a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int inner_weight = 255 - outer_weight; 7648a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7658a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // round these guys up if they're bigger than 127 7668a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com outer_weight += outer_weight >> 7; 7678a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com inner_weight += inner_weight >> 7; 7688a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7698a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t outer_scale = (outer_weight << 16) / ((2*rx + 1)*(2*ry + 1)); 7708a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t inner_scale = (inner_weight << 16) / ((2*rx - 1)*(2*ry - 1)); 7718a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7724560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int sumStride = sw + 1; 7738a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7748a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int dw = sw + 2*rx; 7758a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int dh = sh + 2*ry; 7768a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7774560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int prev_y = -2*ry; 7784560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int next_y = 1; 7798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(2*rx <= dw - 2*rx); 7818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 7824560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com for (int y = 0; y < dh; y++) { 7834560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int py = SkClampPos(prev_y) * sumStride; 7844560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int ny = SkFastMin32(next_y, sh) * sumStride; 7858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7864560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int ipy = SkClampPos(prev_y + 1) * sumStride; 7874560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int iny = SkClampMax(next_y - 1, sh) * sumStride; 7888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7894560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int prev_x = -2*rx; 7904560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com int next_x = 1; 7918caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int x = 0; 7928a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7938caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (; x < 2*rx; x++) { 7948caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x < 0); 7958caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x <= sw); 7968a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 7978caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = 0; 7988caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = next_x; 7998caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8008caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipx = 0; 8018caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inx = next_x - 1; 8028caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8038caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_sum = sum[px+py] + sum[nx+ny] 8048caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[nx+py] - sum[px+ny]; 8058caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny] 8068caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[inx+ipy] - sum[ipx+iny]; 8078caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 8088caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 8098caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8108caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 8118caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 8128caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 8138caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 81401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i0 = prev_x + py; 81501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i1 = next_x + ny; 81601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i2 = next_x + py; 81701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i3 = prev_x + ny; 81801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i4 = prev_x + 1 + ipy; 81901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i5 = next_x - 1 + iny; 82001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i6 = next_x - 1 + ipy; 82101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com int i7 = prev_x + 1 + iny; 82201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 82301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#if UNROLL_KERNEL_LOOP 82401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x < dw - 2*rx - 4; x += 4) { 8258caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x >= 0); 8268caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x <= sw); 8278caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 82801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 82901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 83001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 83101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com + inner_sum * inner_scale) >> 24); 83201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 83301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 83401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 83501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com + inner_sum * inner_scale) >> 24); 83601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 83701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 83801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 83901224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com + inner_sum * inner_scale) >> 24); 84001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 84101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 84201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 84301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com + inner_sum * inner_scale) >> 24); 8448caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 84501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com prev_x += 4; 84601224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com next_x += 4; 84701224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com } 84801224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com#endif 8498a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 85001224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com for (; x < dw - 2*rx; x++) { 85101224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com SkASSERT(prev_x >= 0); 85201224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com SkASSERT(next_x <= sw); 85301224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com 85401224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t outer_sum = sum[i0++] + sum[i1++] - sum[i2++] - sum[i3++]; 85501224d5d0a3228fe47e63d8346e0e433a87563a8tomhudson@google.com uint32_t inner_sum = sum[i4++] + sum[i5++] - sum[i6++] - sum[i7++]; 8568caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 8578caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 8588a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com prev_x += 1; 8608a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com next_x += 1; 8618a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 8628caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8638caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com for (; x < dw; x++) { 8648caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(prev_x >= 0); 8658caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com SkASSERT(next_x > sw); 8668caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8678caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int px = prev_x; 8688caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int nx = sw; 8698caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8708caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int ipx = prev_x + 1; 8718caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com int inx = sw; 8728caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8738caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t outer_sum = sum[px+py] + sum[nx+ny] 8748caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[nx+py] - sum[px+ny]; 8758caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com uint32_t inner_sum = sum[ipx+ipy] + sum[inx+iny] 8768caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com - sum[inx+ipy] - sum[ipx+iny]; 8778caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com *dst++ = SkToU8((outer_sum * outer_scale 8788caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com + inner_sum * inner_scale) >> 24); 8798caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8808caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com prev_x += 1; 8818caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com next_x += 1; 8828caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com } 8838caac6447dd68655b57dfe876626a9733b191416tomhudson@google.com 8848a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com prev_y += 1; 8858a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com next_y += 1; 8868a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 8878a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 8888a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8898a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com#include "SkColorPriv.h" 8908a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 8910e3c664250f561ec9f7107b92136517a72d03afdreed@android.comstatic void merge_src_with_blur(uint8_t dst[], int dstRB, 8920e3c664250f561ec9f7107b92136517a72d03afdreed@android.com const uint8_t src[], int srcRB, 8930e3c664250f561ec9f7107b92136517a72d03afdreed@android.com const uint8_t blur[], int blurRB, 8940e3c664250f561ec9f7107b92136517a72d03afdreed@android.com int sw, int sh) { 8950e3c664250f561ec9f7107b92136517a72d03afdreed@android.com dstRB -= sw; 8960e3c664250f561ec9f7107b92136517a72d03afdreed@android.com srcRB -= sw; 8970e3c664250f561ec9f7107b92136517a72d03afdreed@android.com blurRB -= sw; 8980e3c664250f561ec9f7107b92136517a72d03afdreed@android.com while (--sh >= 0) { 8990e3c664250f561ec9f7107b92136517a72d03afdreed@android.com for (int x = sw - 1; x >= 0; --x) { 9008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com *dst = SkToU8(SkAlphaMul(*blur, SkAlpha255To256(*src))); 9018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst += 1; 9028a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += 1; 9038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com blur += 1; 9048a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 9050e3c664250f561ec9f7107b92136517a72d03afdreed@android.com dst += dstRB; 9060e3c664250f561ec9f7107b92136517a72d03afdreed@android.com src += srcRB; 9070e3c664250f561ec9f7107b92136517a72d03afdreed@android.com blur += blurRB; 9088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 9098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 9108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9118a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.comstatic void clamp_with_orig(uint8_t dst[], int dstRowBytes, 9120e3c664250f561ec9f7107b92136517a72d03afdreed@android.com const uint8_t src[], int srcRowBytes, 9130e3c664250f561ec9f7107b92136517a72d03afdreed@android.com int sw, int sh, 9144560767bb0b3db530d48e2b0c1c11e28f3692984reed@android.com SkBlurMask::Style style) { 9158a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int x; 9160e3c664250f561ec9f7107b92136517a72d03afdreed@android.com while (--sh >= 0) { 9178a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com switch (style) { 9188a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com case SkBlurMask::kSolid_Style: 9190e3c664250f561ec9f7107b92136517a72d03afdreed@android.com for (x = sw - 1; x >= 0; --x) { 9200e3c664250f561ec9f7107b92136517a72d03afdreed@android.com int s = *src; 9210e3c664250f561ec9f7107b92136517a72d03afdreed@android.com int d = *dst; 9220e3c664250f561ec9f7107b92136517a72d03afdreed@android.com *dst = SkToU8(s + d - SkMulDiv255Round(s, d)); 9238a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst += 1; 9248a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += 1; 9258a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 9268a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com break; 9278a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com case SkBlurMask::kOuter_Style: 9280e3c664250f561ec9f7107b92136517a72d03afdreed@android.com for (x = sw - 1; x >= 0; --x) { 9290e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (*src) { 9308a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com *dst = SkToU8(SkAlphaMul(*dst, SkAlpha255To256(255 - *src))); 9310e3c664250f561ec9f7107b92136517a72d03afdreed@android.com } 9328a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst += 1; 9338a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com src += 1; 9348a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 9358a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com break; 9368a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com default: 9370c00f21fee3f5cfa3aa7e5d46ff94cb8cf340451tomhudson@google.com SkDEBUGFAIL("Unexpected blur style here"); 9388a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com break; 9398a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 9408a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst += dstRowBytes - sw; 9410e3c664250f561ec9f7107b92136517a72d03afdreed@android.com src += srcRowBytes - sw; 9428a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 9438a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 9448a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 94503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com/////////////////////////////////////////////////////////////////////////////// 9468a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 94733cdbdea3ddcec9323b65eace86e10557312ae9bbsalomon@google.com// we use a local function to wrap the class static method to work around 9488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com// a bug in gcc98 9498a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.comvoid SkMask_FreeImage(uint8_t* image); 95003016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.comvoid SkMask_FreeImage(uint8_t* image) { 9518a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkMask::FreeImage(image); 9528a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 9538a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9548a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.combool SkBlurMask::Blur(SkMask* dst, const SkMask& src, 9555af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com SkScalar radius, Style style, Quality quality, 95671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkIPoint* margin, bool separable) 9575af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com{ 95803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com if (src.fFormat != SkMask::kA8_Format) { 9598a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com return false; 96003016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com } 9618a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9624868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org // Force high quality off for small radii (performance) 96391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (radius < SkIntToScalar(3)) { 96491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org quality = kLow_Quality; 96591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } 9664868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org 9674868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org // highQuality: use three box blur passes as a cheap way to approximate a Gaussian blur 96891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org int passCount = (kHigh_Quality == quality) ? 3 : 1; 9697c7292c6071898d73dc935c3b66b9816183806f0humper@google.com SkScalar passRadius = (kHigh_Quality == quality) ? SkScalarMul( radius, kBlurRadiusFudgeFactor): radius; 9704868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org 9714868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int rx = SkScalarCeil(passRadius); 9724868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int outer_weight = 255 - SkScalarRound((SkIntToScalar(rx) - passRadius) * 255); 9738a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9748a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkASSERT(rx >= 0); 9758a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkASSERT((unsigned)outer_weight <= 255); 9760e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (rx <= 0) { 9778a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com return false; 9780e3c664250f561ec9f7107b92136517a72d03afdreed@android.com } 9798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9808a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int ry = rx; // only do square blur for now 9818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9824868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int padx = passCount * rx; 9834868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int pady = passCount * ry; 9845af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com if (margin) { 9855af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com margin->set(padx, pady); 9865af16f8d670b3ce1c7644a4737e02e2e2257614ebungeman@google.com } 9874868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org dst->fBounds.set(src.fBounds.fLeft - padx, src.fBounds.fTop - pady, 9884868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org src.fBounds.fRight + padx, src.fBounds.fBottom + pady); 98949f0ff25a046d6001dc2d095b6fa3c30f0f46b6areed@android.com dst->fRowBytes = dst->fBounds.width(); 9908a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst->fFormat = SkMask::kA8_Format; 9918a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst->fImage = NULL; 9928a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 9930e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (src.fImage) { 994543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com size_t dstSize = dst->computeImageSize(); 995543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com if (0 == dstSize) { 996543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com return false; // too big to allocate, abort 997543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com } 998543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com 9998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int sw = src.fBounds.width(); 10008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com int sh = src.fBounds.height(); 10018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com const uint8_t* sp = src.fImage; 1002543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com uint8_t* dp = SkMask::AllocImage(dstSize); 10038a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 10048a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkAutoTCallVProc<uint8_t, SkMask_FreeImage> autoCall(dp); 10058a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 10068a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // build the blurry destination 100771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org if (separable) { 100871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkAutoTMalloc<uint8_t> tmpBuffer(dstSize); 100971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org uint8_t* tp = tmpBuffer.get(); 101071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org int w = sw, h = sh; 101171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org 101291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (outer_weight == 255) { 1013c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org int loRadius, hiRadius; 1014c4381309649c5cf338dcf6a7fc8296451a686d6bsenorblanco@chromium.org get_adjusted_radii(passRadius, &loRadius, &hiRadius); 101591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (kHigh_Quality == quality) { 101691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org // Do three X blurs, with a transpose on the final one. 101791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlur(sp, src.fRowBytes, tp, loRadius, hiRadius, w, h, false); 101891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlur(tp, w, dp, hiRadius, loRadius, w, h, false); 101991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlur(dp, w, tp, hiRadius, hiRadius, w, h, true); 102091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org // Do three Y blurs, with a transpose on the final one. 102191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlur(tp, h, dp, loRadius, hiRadius, h, w, false); 102291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlur(dp, h, tp, hiRadius, loRadius, h, w, false); 102391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlur(tp, h, dp, hiRadius, hiRadius, h, w, true); 102491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } else { 102591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlur(sp, src.fRowBytes, tp, rx, rx, w, h, true); 102691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlur(tp, h, dp, ry, ry, h, w, true); 102791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } 1028908276b3969cf8f8eec28026363897134c0e54e0senorblanco@chromium.org } else { 102991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (kHigh_Quality == quality) { 103091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org // Do three X blurs, with a transpose on the final one. 103191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlurInterp(sp, src.fRowBytes, tp, rx, w, h, false, outer_weight); 103291f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlurInterp(tp, w, dp, rx, w, h, false, outer_weight); 103391f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlurInterp(dp, w, tp, rx, w, h, true, outer_weight); 103491f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org // Do three Y blurs, with a transpose on the final one. 103591f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlurInterp(tp, h, dp, ry, h, w, false, outer_weight); 103691f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlurInterp(dp, h, tp, ry, h, w, false, outer_weight); 103791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlurInterp(tp, h, dp, ry, h, w, true, outer_weight); 103891f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } else { 103991f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org w = boxBlurInterp(sp, src.fRowBytes, tp, rx, w, h, true, outer_weight); 104091f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org h = boxBlurInterp(tp, h, dp, ry, h, w, true, outer_weight); 104191f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org } 104271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } 104371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org } else { 104403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com const size_t storageW = sw + 2 * (passCount - 1) * rx + 1; 104503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com const size_t storageH = sh + 2 * (passCount - 1) * ry + 1; 104603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com SkAutoTMalloc<uint32_t> storage(storageW * storageH); 10478a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com uint32_t* sumBuffer = storage.get(); 10488a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 10494868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org //pass1: sp is source, dp is destination 10508a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com build_sum_buffer(sumBuffer, sw, sh, sp, src.fRowBytes); 105103016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com if (outer_weight == 255) { 10528a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com apply_kernel(dp, rx, ry, sumBuffer, sw, sh); 105303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com } else { 10548a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com apply_kernel_interp(dp, rx, ry, sumBuffer, sw, sh, outer_weight); 105503016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com } 10564868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org 105791f489a65d436d36c7fe580af2775cd0cd13c8d2senorblanco@chromium.org if (kHigh_Quality == quality) { 10584868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org //pass2: dp is source, tmpBuffer is destination 10594868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int tmp_sw = sw + 2 * rx; 10604868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org int tmp_sh = sh + 2 * ry; 10614868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org SkAutoTMalloc<uint8_t> tmpBuffer(dstSize); 10624868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org build_sum_buffer(sumBuffer, tmp_sw, tmp_sh, dp, tmp_sw); 10634868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org if (outer_weight == 255) 10644868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org apply_kernel(tmpBuffer.get(), rx, ry, sumBuffer, tmp_sw, tmp_sh); 10654868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org else 106603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com apply_kernel_interp(tmpBuffer.get(), rx, ry, sumBuffer, 106703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com tmp_sw, tmp_sh, outer_weight); 10684868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org 10694868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org //pass3: tmpBuffer is source, dp is destination 10704868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org tmp_sw += 2 * rx; 10714868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org tmp_sh += 2 * ry; 10724868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org build_sum_buffer(sumBuffer, tmp_sw, tmp_sh, tmpBuffer.get(), tmp_sw); 10734868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org if (outer_weight == 255) 10744868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org apply_kernel(dp, rx, ry, sumBuffer, tmp_sw, tmp_sh); 10754868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org else 107603016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com apply_kernel_interp(dp, rx, ry, sumBuffer, tmp_sw, tmp_sh, 107703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com outer_weight); 10784868e6b221a4a98e40f977851af5fcf09631ea15senorblanco@chromium.org } 10798a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 10808a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 10818a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst->fImage = dp; 10828a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // if need be, alloc the "real" dst (same size as src) and copy/merge 10838a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com // the blur into it (applying the src) 10840e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (style == kInner_Style) { 10850e3c664250f561ec9f7107b92136517a72d03afdreed@android.com // now we allocate the "real" dst, mirror the size of src 1086543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com size_t srcSize = src.computeImageSize(); 1087543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com if (0 == srcSize) { 1088543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com return false; // too big to allocate, abort 1089543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com } 1090543ed9352c7dfd93071c08b14930cca2e82a08d4reed@android.com dst->fImage = SkMask::AllocImage(srcSize); 10910e3c664250f561ec9f7107b92136517a72d03afdreed@android.com merge_src_with_blur(dst->fImage, src.fRowBytes, 10920e3c664250f561ec9f7107b92136517a72d03afdreed@android.com sp, src.fRowBytes, 109303016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com dp + passCount * (rx + ry * dst->fRowBytes), 109403016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com dst->fRowBytes, sw, sh); 10958a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com SkMask::FreeImage(dp); 10960e3c664250f561ec9f7107b92136517a72d03afdreed@android.com } else if (style != kNormal_Style) { 109703016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com clamp_with_orig(dp + passCount * (rx + ry * dst->fRowBytes), 109803016a36206be42e91e8e0eb62fe8fb95da97b38reed@google.com dst->fRowBytes, sp, src.fRowBytes, sw, sh, style); 10998a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 11008a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com (void)autoCall.detach(); 11018a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 11028a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 11030e3c664250f561ec9f7107b92136517a72d03afdreed@android.com if (style == kInner_Style) { 11048a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com dst->fBounds = src.fBounds; // restore trimmed bounds 11050e3c664250f561ec9f7107b92136517a72d03afdreed@android.com dst->fRowBytes = src.fRowBytes; 11068a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com } 11078a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 11088a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com return true; 11098a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com} 11108a1c16ff38322f0210116fa7293eb8817c7e477ereed@android.com 111171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.orgbool SkBlurMask::BlurSeparable(SkMask* dst, const SkMask& src, 111271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkScalar radius, Style style, Quality quality, 111371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkIPoint* margin) 111471f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{ 111571f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org return SkBlurMask::Blur(dst, src, radius, style, quality, margin, true); 111671f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org} 111771f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org 111871f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.orgbool SkBlurMask::Blur(SkMask* dst, const SkMask& src, 111971f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkScalar radius, Style style, Quality quality, 112071f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org SkIPoint* margin) 112171f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org{ 112271f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org return SkBlurMask::Blur(dst, src, radius, style, quality, margin, false); 112371f0f34f7d8e80fe760f318f29ba88ab58baff7dsenorblanco@chromium.org} 11247c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11257c7292c6071898d73dc935c3b66b9816183806f0humper@google.com/* Convolving a box with itself three times results in a piecewise 11267c7292c6071898d73dc935c3b66b9816183806f0humper@google.com quadratic function: 11278ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11287c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 0 x <= -1.5 11297c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 9/8 + 3/2 x + 1/2 x^2 -1.5 < x <= 1.5 11307c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 3/4 - x^2 -.5 < x <= .5 11317c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 9/8 - 3/2 x + 1/2 x^2 0.5 < x <= 1.5 11327c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 0 1.5 < x 11338ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11347c7292c6071898d73dc935c3b66b9816183806f0humper@google.com To get the profile curve of the blurred step function at the rectangle 11357c7292c6071898d73dc935c3b66b9816183806f0humper@google.com edge, we evaluate the indefinite integral, which is piecewise cubic: 11368ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11377c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 0 x <= -1.5 11387c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 5/8 + 9/8 x + 3/4 x^2 + 1/6 x^3 -1.5 < x <= -0.5 11397c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 1/2 + 3/4 x - 1/3 x^3 -.5 < x <= .5 11407c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 3/8 + 9/8 x - 3/4 x^2 + 1/6 x^3 .5 < x <= 1.5 11417c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 1 1.5 < x 11427c7292c6071898d73dc935c3b66b9816183806f0humper@google.com*/ 11437c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11447c7292c6071898d73dc935c3b66b9816183806f0humper@google.comstatic float gaussian_integral( float x ) { 11457c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if ( x > 1.5f ) { 11467c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return 0.0f; 11477c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11487c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if ( x < -1.5f ) { 11497c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return 1.0f; 11507c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11517c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11527c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float x2 = x*x; 11537c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float x3 = x2*x; 11547c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11559c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com if ( x > 0.5f ) { 11569c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com return 0.5625f - ( x3 / 6.0f - 3.0f * x2 * 0.25f + 1.125f * x); 11577c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11589c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com if ( x > -0.5f ) { 11599c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com return 0.5f - (0.75f * x - x3 / 3.0f); 11607c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11619c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com return 0.4375f + (-x3 / 6.0f - 3.0f * x2 * 0.25f - 1.125f * x); 11627c7292c6071898d73dc935c3b66b9816183806f0humper@google.com} 11637c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11648ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com/* 11657c7292c6071898d73dc935c3b66b9816183806f0humper@google.com compute_profile allocates and fills in an array of floating 11668ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com point values between 0 and 255 for the profile signature of 11677c7292c6071898d73dc935c3b66b9816183806f0humper@google.com a blurred half-plane with the given blur radius. Since we're 11687c7292c6071898d73dc935c3b66b9816183806f0humper@google.com going to be doing screened multiplications (i.e., 1 - (1-x)(1-y)) 11697c7292c6071898d73dc935c3b66b9816183806f0humper@google.com all the time, we actually fill in the profile pre-inverted 11707c7292c6071898d73dc935c3b66b9816183806f0humper@google.com (already done 255-x). 11718ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 11727c7292c6071898d73dc935c3b66b9816183806f0humper@google.com The function returns the size of the array allocated for the 11738ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com profile. It's the responsibility of the caller to delete the 11747c7292c6071898d73dc935c3b66b9816183806f0humper@google.com memory returned in profile_out. 11757c7292c6071898d73dc935c3b66b9816183806f0humper@google.com*/ 11767c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11777c7292c6071898d73dc935c3b66b9816183806f0humper@google.comstatic int compute_profile( SkScalar radius, unsigned int **profile_out ) { 11789c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com int size = SkScalarFloorToInt(radius * 3 + 1); 11797c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int center = size >> 1; 11807c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 118133cdbdea3ddcec9323b65eace86e10557312ae9bbsalomon@google.com unsigned int *profile = SkNEW_ARRAY(unsigned int, size); 11827c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11837c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float invr = 1.0f/radius; 11847c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11857c7292c6071898d73dc935c3b66b9816183806f0humper@google.com profile[0] = 255; 11867c7292c6071898d73dc935c3b66b9816183806f0humper@google.com for (int x = 1 ; x < size ; x++) { 11877c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float scaled_x = ( center - x ) * invr; 11887c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float gi = gaussian_integral( scaled_x ); 11897c7292c6071898d73dc935c3b66b9816183806f0humper@google.com profile[x] = 255 - (uint8_t) ( 255.f * gi ); 11907c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 11917c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11927c7292c6071898d73dc935c3b66b9816183806f0humper@google.com *profile_out = profile; 11937c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return size; 11947c7292c6071898d73dc935c3b66b9816183806f0humper@google.com} 11957c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 11968ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com// TODO MAYBE: Maintain a profile cache to avoid recomputing this for 11977c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// commonly used radii. Consider baking some of the most common blur radii 11987c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// directly in as static data? 11997c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 12007c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// Implementation adapted from Michael Herf's approach: 12017c7292c6071898d73dc935c3b66b9816183806f0humper@google.com// http://stereopsis.com/shadowrect/ 12027c7292c6071898d73dc935c3b66b9816183806f0humper@google.com 12037c7292c6071898d73dc935c3b66b9816183806f0humper@google.combool SkBlurMask::BlurRect(SkMask *dst, const SkRect &src, 12047c7292c6071898d73dc935c3b66b9816183806f0humper@google.com SkScalar provided_radius, Style style, Quality quality, 12057c7292c6071898d73dc935c3b66b9816183806f0humper@google.com SkIPoint *margin) { 12067c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int profile_size; 12077c7292c6071898d73dc935c3b66b9816183806f0humper@google.com unsigned int *profile; 12088ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12098ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12107c7292c6071898d73dc935c3b66b9816183806f0humper@google.com float radius = SkScalarToFloat( SkScalarMul( provided_radius, kBlurRadiusFudgeFactor ) ); 12118ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12127c7292c6071898d73dc935c3b66b9816183806f0humper@google.com profile_size = compute_profile( radius, &profile ); 121333cdbdea3ddcec9323b65eace86e10557312ae9bbsalomon@google.com SkAutoTDeleteArray<unsigned int> ada(profile); 12148ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12157c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int pad = (int) (radius * 1.5f + 1); 12167c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if (margin) { 12177c7292c6071898d73dc935c3b66b9816183806f0humper@google.com margin->set( pad, pad ); 12187c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 12199c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com dst->fBounds = SkIRect::MakeWH(SkScalarFloorToInt(src.width()), SkScalarFloorToInt(src.height())); 12207c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fBounds.outset(pad, pad); 12218ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12227c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fRowBytes = dst->fBounds.width(); 12237c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fFormat = SkMask::kA8_Format; 12247c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fImage = NULL; 12258ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12267c7292c6071898d73dc935c3b66b9816183806f0humper@google.com size_t dstSize = dst->computeImageSize(); 12277c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if (0 == dstSize) { 12287c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return false; // too big to allocate, abort 12297c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 12308ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12319c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com int sw = SkScalarFloorToInt(src.width()); 12329c4e5ac5b7d32151d4d8ab1fb7ed443b35eb1254jvanverth@google.com int sh = SkScalarFloorToInt(src.height()); 12338ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12347c7292c6071898d73dc935c3b66b9816183806f0humper@google.com uint8_t* dp = SkMask::AllocImage(dstSize); 12358ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12367c7292c6071898d73dc935c3b66b9816183806f0humper@google.com dst->fImage = dp; 12378ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12387c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int dst_height = dst->fBounds.height(); 12397c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int dst_width = dst->fBounds.width(); 12408ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12417c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // nearest odd number less than the profile size represents the center 12427c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // of the (2x scaled) profile 12437c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int center = ( profile_size & ~1 ) - 1; 12448ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12457c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int w = sw - center; 12467c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int h = sh - center; 12478ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12487c7292c6071898d73dc935c3b66b9816183806f0humper@google.com uint8_t *outptr = dp; 12498ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12507c7292c6071898d73dc935c3b66b9816183806f0humper@google.com for (int y = 0 ; y < dst_height ; y++) 12517c7292c6071898d73dc935c3b66b9816183806f0humper@google.com { 12527c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // time to fill in a scanline of the blurry rectangle. 12537c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // to avoid floating point math, everything is multiplied by 12547c7292c6071898d73dc935c3b66b9816183806f0humper@google.com // 2 where needed. This keeps things nice and integer-oriented. 12558ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12567c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int dy = abs((y << 1) - dst_height) - h; // how far are we from the original edge? 12577c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int oy = dy >> 1; 12587c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if (oy < 0) oy = 0; 12598ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12607c7292c6071898d73dc935c3b66b9816183806f0humper@google.com unsigned int profile_y = profile[oy]; 12618ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12627c7292c6071898d73dc935c3b66b9816183806f0humper@google.com for (int x = 0 ; x < (dst_width << 1) ; x += 2) { 12637c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int dx = abs( x - dst_width ) - w; 12647c7292c6071898d73dc935c3b66b9816183806f0humper@google.com int ox = dx >> 1; 12657c7292c6071898d73dc935c3b66b9816183806f0humper@google.com if (ox < 0) ox = 0; 12668ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12677c7292c6071898d73dc935c3b66b9816183806f0humper@google.com unsigned int maskval = SkMulDiv255Round(profile[ox], profile_y); 12688ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12697c7292c6071898d73dc935c3b66b9816183806f0humper@google.com *(outptr++) = maskval; 12707c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 12717c7292c6071898d73dc935c3b66b9816183806f0humper@google.com } 12728ae714b186ae5f4eaddee239281fbfe7282320c9skia.committer@gmail.com 12737c7292c6071898d73dc935c3b66b9816183806f0humper@google.com return true; 12747c7292c6071898d73dc935c3b66b9816183806f0humper@google.com} 1275