10d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams/* 20d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * Copyright (C) 2014 The Android Open Source Project 30d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * 40d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * Licensed under the Apache License, Version 2.0 (the "License"); 50d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * you may not use this file except in compliance with the License. 60d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * You may obtain a copy of the License at 70d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * 80d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * http://www.apache.org/licenses/LICENSE-2.0 90d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * 100d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * Unless required by applicable law or agreed to in writing, software 110d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * distributed under the License is distributed on an "AS IS" BASIS, 120d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 130d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * See the License for the specific language governing permissions and 140d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams * limitations under the License. 150d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams */ 160d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 170d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams#include "ip.rsh" 180d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams#pragma rs_fp_relaxed 190d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 200d6043caef208ee6c661eb17bcb376abfe90cd48Jason Samsint32_t gWidthIn; 210d6043caef208ee6c661eb17bcb376abfe90cd48Jason Samsint32_t gHeightIn; 220d6043caef208ee6c661eb17bcb376abfe90cd48Jason Samsrs_allocation gIn; 230d6043caef208ee6c661eb17bcb376abfe90cd48Jason Samsfloat scale; 240d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 250d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 260d6043caef208ee6c661eb17bcb376abfe90cd48Jason Samsuchar4 __attribute__((kernel)) nearest(uint32_t x, uint32_t y) { 270d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float xf = clamp(x * scale, 0.f, (float)gWidthIn - 1.f); 280d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float yf = clamp(y * scale, 0.f, (float)gHeightIn - 1.f); 290d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t ix = xf; 300d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t iy = yf; 310d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 320d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uchar4 tmp = rsGetElementAt_uchar4(gIn, ix, iy); 330d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams tmp.a = 0xff; 340d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams return tmp; 350d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams} 360d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 370d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 380d6043caef208ee6c661eb17bcb376abfe90cd48Jason Samsstatic float4 cubicInterpolate (float4 p0,float4 p1,float4 p2,float4 p3 , float x) { 390d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams return p1 + 0.5f * x * (p2 - p0 + x * (2.f * p0 - 5.f * p1 + 4.f * p2 - p3 400d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams + x * (3.f * (p1 - p2) + p3 - p0))); 410d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams} 420d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 430d6043caef208ee6c661eb17bcb376abfe90cd48Jason Samsuchar4 __attribute__((kernel)) bicubic(uint32_t x, uint32_t y) { 440d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float xf = x * scale; 450d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float yf = y * scale; 460d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 470d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams int startx = (int) floor(xf - 2); 480d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams int starty = (int) floor(yf - 2); 490d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams xf = xf - floor(xf); 500d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams yf = yf - floor(yf); 510d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams int maxx = gWidthIn - 1; 520d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams int maxy = gHeightIn - 1; 530d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 540d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t xs0 = (uint32_t) max(0, startx + 0); 550d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t xs1 = (uint32_t) max(0, startx + 1); 560d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t xs2 = (uint32_t) min(maxx, startx + 2); 570d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t xs3 = (uint32_t) min(maxx, startx + 3); 580d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 590d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t ys0 = (uint32_t) max(0, starty + 0); 600d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t ys1 = (uint32_t) max(0, starty + 1); 610d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t ys2 = (uint32_t) min(maxy, starty + 2); 620d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams uint32_t ys3 = (uint32_t) min(maxy, starty + 3); 630d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 640d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p00 = convert_float4(rsGetElementAt_uchar4(gIn, xs0, ys0)); 650d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p01 = convert_float4(rsGetElementAt_uchar4(gIn, xs1, ys0)); 660d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p02 = convert_float4(rsGetElementAt_uchar4(gIn, xs2, ys0)); 670d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p03 = convert_float4(rsGetElementAt_uchar4(gIn, xs3, ys0)); 680ef64c5373a119eb73cbf7b1f7cf7d1da12d97d3Jason Sams float4 p0 = cubicInterpolate(p00, p01, p02, p03, xf); 690d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 700d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p10 = convert_float4(rsGetElementAt_uchar4(gIn, xs0, ys1)); 710d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p11 = convert_float4(rsGetElementAt_uchar4(gIn, xs1, ys1)); 720d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p12 = convert_float4(rsGetElementAt_uchar4(gIn, xs2, ys1)); 730d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p13 = convert_float4(rsGetElementAt_uchar4(gIn, xs3, ys1)); 740ef64c5373a119eb73cbf7b1f7cf7d1da12d97d3Jason Sams float4 p1 = cubicInterpolate(p10, p11, p12, p13, xf); 750d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 760d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p20 = convert_float4(rsGetElementAt_uchar4(gIn, xs0, ys2)); 770d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p21 = convert_float4(rsGetElementAt_uchar4(gIn, xs1, ys2)); 780d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p22 = convert_float4(rsGetElementAt_uchar4(gIn, xs2, ys2)); 790d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p23 = convert_float4(rsGetElementAt_uchar4(gIn, xs3, ys2)); 800ef64c5373a119eb73cbf7b1f7cf7d1da12d97d3Jason Sams float4 p2 = cubicInterpolate(p20, p21, p22, p23, xf); 810d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 820d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p30 = convert_float4(rsGetElementAt_uchar4(gIn, xs0, ys3)); 830d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p31 = convert_float4(rsGetElementAt_uchar4(gIn, xs1, ys3)); 840d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p32 = convert_float4(rsGetElementAt_uchar4(gIn, xs2, ys3)); 850d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams float4 p33 = convert_float4(rsGetElementAt_uchar4(gIn, xs3, ys3)); 860ef64c5373a119eb73cbf7b1f7cf7d1da12d97d3Jason Sams float4 p3 = cubicInterpolate(p30, p31, p32, p33, xf); 870d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 880ef64c5373a119eb73cbf7b1f7cf7d1da12d97d3Jason Sams float4 p = cubicInterpolate(p0, p1, p2, p3, yf); 89da68eff288c8b403bc41c1fa856ca09d73f35e2fMiao Wang p = clamp(p + 0.5f, 0.f, 255.f); 900d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams return convert_uchar4(p); 910d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams} 920d6043caef208ee6c661eb17bcb376abfe90cd48Jason Sams 93