blob: 77da230bda4e825a1177b6ea62688b57ded3efc9 [file] [log] [blame]
/*
* Copyright (C) 2013 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "shared.rsh"
/*
 * Script globals read by every convolve_* kernel in this file. None of them
 * is assigned here; they are expected to be set by the caller before a kernel
 * is launched.
 */

/* The kernels cap the x+1 neighbor coordinate at gWidth-1.
 * Presumably the X dimension of gIn - confirm against the host code. */
int32_t gWidth;
/* The kernels cap the y+1 neighbor coordinate at gHeight-1.
 * Presumably the Y dimension of gIn - confirm against the host code. */
int32_t gHeight;
/* Source allocation sampled with rsGetElementAt_<type>(gIn, x, y). Its
 * element type must match the kernel being run (uchar/uchar2/uchar3/uchar4
 * or float/float2/float3/float4). */
rs_allocation gIn;
/* Nine weights, one per sampled neighbor. Indices 0..2 apply to row y+1,
 * 3..5 to row y and 6..8 to row y-1; within each row the order is
 * x+1, x, x-1. */
float gCoeffs[9];
/*
 * 3x3 weighted neighborhood sum over gIn for uchar4 cells.
 *
 * x, y: coordinates of the cell being produced.
 * Returns the weighted sum of the nine cells around (x, y) with 0.5 added,
 * clamped to [0, 255] and converted back to uchar4.
 *
 * Neighbor coordinates x+1 / y+1 are capped at gWidth-1 / gHeight-1 and
 * x-1 / y-1 are floored at 0, so border cells reuse the edge row/column.
 * gCoeffs[0..2] weight row y+1, gCoeffs[3..5] row y, gCoeffs[6..8] row y-1;
 * within each row the order is x+1, x, x-1.
 */
uchar4 __attribute__((kernel)) convolve_U4(uint32_t x, uint32_t y) {
    const uint32_t xNext = min((int32_t)x + 1, gWidth - 1);
    const uint32_t xPrev = max((int32_t)x - 1, 0);
    const uint32_t yNext = min((int32_t)y + 1, gHeight - 1);
    const uint32_t yPrev = max((int32_t)y - 1, 0);

    /* Row y+1. */
    const float4 w0 = convert_float4(rsGetElementAt_uchar4(gIn, xNext, yNext)) * gCoeffs[0];
    const float4 w1 = convert_float4(rsGetElementAt_uchar4(gIn, x, yNext)) * gCoeffs[1];
    const float4 w2 = convert_float4(rsGetElementAt_uchar4(gIn, xPrev, yNext)) * gCoeffs[2];
    /* Row y. */
    const float4 w3 = convert_float4(rsGetElementAt_uchar4(gIn, xNext, y)) * gCoeffs[3];
    const float4 w4 = convert_float4(rsGetElementAt_uchar4(gIn, x, y)) * gCoeffs[4];
    const float4 w5 = convert_float4(rsGetElementAt_uchar4(gIn, xPrev, y)) * gCoeffs[5];
    /* Row y-1. */
    const float4 w6 = convert_float4(rsGetElementAt_uchar4(gIn, xNext, yPrev)) * gCoeffs[6];
    const float4 w7 = convert_float4(rsGetElementAt_uchar4(gIn, x, yPrev)) * gCoeffs[7];
    const float4 w8 = convert_float4(rsGetElementAt_uchar4(gIn, xPrev, yPrev)) * gCoeffs[8];

    /* The parenthesization pins the floating-point summation order. */
    const float4 total = ((w6 + w7) + (w8 + (w0 + w1))) + ((w2 + w3) + (w4 + w5));

    /* 0.5 is added before the conversion, presumably so that it rounds to
     * nearest rather than truncating - confirm against convert_uchar4. */
    return convert_uchar4(clamp(total + 0.5f, 0.f, 255.f));
}
/*
 * 3x3 weighted neighborhood sum over gIn for uchar3 cells.
 *
 * x, y: coordinates of the cell being produced.
 * Returns the weighted sum of the nine cells around (x, y) with 0.5 added,
 * clamped to [0, 255] and converted back to uchar3.
 *
 * Neighbor coordinates x+1 / y+1 are capped at gWidth-1 / gHeight-1 and
 * x-1 / y-1 are floored at 0, so border cells reuse the edge row/column.
 * gCoeffs[0..2] weight row y+1, gCoeffs[3..5] row y, gCoeffs[6..8] row y-1;
 * within each row the order is x+1, x, x-1.
 */
uchar3 __attribute__((kernel)) convolve_U3(uint32_t x, uint32_t y) {
    const uint32_t xNext = min((int32_t)x + 1, gWidth - 1);
    const uint32_t xPrev = max((int32_t)x - 1, 0);
    const uint32_t yNext = min((int32_t)y + 1, gHeight - 1);
    const uint32_t yPrev = max((int32_t)y - 1, 0);

    /* Row y+1. */
    const float3 w0 = convert_float3(rsGetElementAt_uchar3(gIn, xNext, yNext)) * gCoeffs[0];
    const float3 w1 = convert_float3(rsGetElementAt_uchar3(gIn, x, yNext)) * gCoeffs[1];
    const float3 w2 = convert_float3(rsGetElementAt_uchar3(gIn, xPrev, yNext)) * gCoeffs[2];
    /* Row y. */
    const float3 w3 = convert_float3(rsGetElementAt_uchar3(gIn, xNext, y)) * gCoeffs[3];
    const float3 w4 = convert_float3(rsGetElementAt_uchar3(gIn, x, y)) * gCoeffs[4];
    const float3 w5 = convert_float3(rsGetElementAt_uchar3(gIn, xPrev, y)) * gCoeffs[5];
    /* Row y-1. */
    const float3 w6 = convert_float3(rsGetElementAt_uchar3(gIn, xNext, yPrev)) * gCoeffs[6];
    const float3 w7 = convert_float3(rsGetElementAt_uchar3(gIn, x, yPrev)) * gCoeffs[7];
    const float3 w8 = convert_float3(rsGetElementAt_uchar3(gIn, xPrev, yPrev)) * gCoeffs[8];

    /* The parenthesization pins the floating-point summation order. */
    const float3 total = ((w6 + w7) + (w8 + (w0 + w1))) + ((w2 + w3) + (w4 + w5));

    /* 0.5 is added before the conversion, presumably so that it rounds to
     * nearest rather than truncating - confirm against convert_uchar3. */
    return convert_uchar3(clamp(total + 0.5f, 0.f, 255.f));
}
/*
 * 3x3 weighted neighborhood sum over gIn for uchar2 cells.
 *
 * x, y: coordinates of the cell being produced.
 * Returns the weighted sum of the nine cells around (x, y) with 0.5 added,
 * clamped to [0, 255] and converted back to uchar2.
 *
 * Neighbor coordinates x+1 / y+1 are capped at gWidth-1 / gHeight-1 and
 * x-1 / y-1 are floored at 0, so border cells reuse the edge row/column.
 * gCoeffs[0..2] weight row y+1, gCoeffs[3..5] row y, gCoeffs[6..8] row y-1;
 * within each row the order is x+1, x, x-1.
 */
uchar2 __attribute__((kernel)) convolve_U2(uint32_t x, uint32_t y) {
    const uint32_t xNext = min((int32_t)x + 1, gWidth - 1);
    const uint32_t xPrev = max((int32_t)x - 1, 0);
    const uint32_t yNext = min((int32_t)y + 1, gHeight - 1);
    const uint32_t yPrev = max((int32_t)y - 1, 0);

    /* Row y+1. */
    const float2 w0 = convert_float2(rsGetElementAt_uchar2(gIn, xNext, yNext)) * gCoeffs[0];
    const float2 w1 = convert_float2(rsGetElementAt_uchar2(gIn, x, yNext)) * gCoeffs[1];
    const float2 w2 = convert_float2(rsGetElementAt_uchar2(gIn, xPrev, yNext)) * gCoeffs[2];
    /* Row y. */
    const float2 w3 = convert_float2(rsGetElementAt_uchar2(gIn, xNext, y)) * gCoeffs[3];
    const float2 w4 = convert_float2(rsGetElementAt_uchar2(gIn, x, y)) * gCoeffs[4];
    const float2 w5 = convert_float2(rsGetElementAt_uchar2(gIn, xPrev, y)) * gCoeffs[5];
    /* Row y-1. */
    const float2 w6 = convert_float2(rsGetElementAt_uchar2(gIn, xNext, yPrev)) * gCoeffs[6];
    const float2 w7 = convert_float2(rsGetElementAt_uchar2(gIn, x, yPrev)) * gCoeffs[7];
    const float2 w8 = convert_float2(rsGetElementAt_uchar2(gIn, xPrev, yPrev)) * gCoeffs[8];

    /* The parenthesization pins the floating-point summation order. */
    const float2 total = ((w6 + w7) + (w8 + (w0 + w1))) + ((w2 + w3) + (w4 + w5));

    /* 0.5 is added before the conversion, presumably so that it rounds to
     * nearest rather than truncating - confirm against convert_uchar2. */
    return convert_uchar2(clamp(total + 0.5f, 0.f, 255.f));
}
/*
 * 3x3 weighted neighborhood sum over gIn for single-channel uchar cells.
 *
 * x, y: coordinates of the cell being produced.
 * Returns the weighted sum of the nine cells around (x, y) with 0.5 added,
 * clamped to [0, 255] and cast back to uchar.
 *
 * Neighbor coordinates x+1 / y+1 are capped at gWidth-1 / gHeight-1 and
 * x-1 / y-1 are floored at 0, so border cells reuse the edge row/column.
 * gCoeffs[0..2] weight row y+1, gCoeffs[3..5] row y, gCoeffs[6..8] row y-1;
 * within each row the order is x+1, x, x-1.
 */
uchar __attribute__((kernel)) convolve_U1(uint32_t x, uint32_t y) {
    const uint32_t xNext = min((int32_t)x + 1, gWidth - 1);
    const uint32_t xPrev = max((int32_t)x - 1, 0);
    const uint32_t yNext = min((int32_t)y + 1, gHeight - 1);
    const uint32_t yPrev = max((int32_t)y - 1, 0);

    /* Row y+1. */
    const float w0 = (float)rsGetElementAt_uchar(gIn, xNext, yNext) * gCoeffs[0];
    const float w1 = (float)rsGetElementAt_uchar(gIn, x, yNext) * gCoeffs[1];
    const float w2 = (float)rsGetElementAt_uchar(gIn, xPrev, yNext) * gCoeffs[2];
    /* Row y. */
    const float w3 = (float)rsGetElementAt_uchar(gIn, xNext, y) * gCoeffs[3];
    const float w4 = (float)rsGetElementAt_uchar(gIn, x, y) * gCoeffs[4];
    const float w5 = (float)rsGetElementAt_uchar(gIn, xPrev, y) * gCoeffs[5];
    /* Row y-1. */
    const float w6 = (float)rsGetElementAt_uchar(gIn, xNext, yPrev) * gCoeffs[6];
    const float w7 = (float)rsGetElementAt_uchar(gIn, x, yPrev) * gCoeffs[7];
    const float w8 = (float)rsGetElementAt_uchar(gIn, xPrev, yPrev) * gCoeffs[8];

    /* The parenthesization pins the floating-point summation order. */
    const float total = ((w6 + w7) + (w8 + (w0 + w1))) + ((w2 + w3) + (w4 + w5));

    /* Adding 0.5 before the truncating float-to-uchar cast rounds the
     * clamped value to the nearest integer. */
    return (uchar)clamp(total + 0.5f, 0.f, 255.f);
}
/*
 * 3x3 weighted neighborhood sum over gIn for float4 cells.
 *
 * x, y: coordinates of the cell being produced.
 * Returns the weighted sum of the nine cells around (x, y); the result is
 * neither rounded nor clamped.
 *
 * Neighbor coordinates x+1 / y+1 are capped at gWidth-1 / gHeight-1 and
 * x-1 / y-1 are floored at 0, so border cells reuse the edge row/column.
 * gCoeffs[0..2] weight row y+1, gCoeffs[3..5] row y, gCoeffs[6..8] row y-1;
 * within each row the order is x+1, x, x-1.
 */
float4 __attribute__((kernel)) convolve_F4(uint32_t x, uint32_t y) {
    const uint32_t xNext = min((int32_t)x + 1, gWidth - 1);
    const uint32_t xPrev = max((int32_t)x - 1, 0);
    const uint32_t yNext = min((int32_t)y + 1, gHeight - 1);
    const uint32_t yPrev = max((int32_t)y - 1, 0);

    /* Row y+1. */
    const float4 w0 = rsGetElementAt_float4(gIn, xNext, yNext) * gCoeffs[0];
    const float4 w1 = rsGetElementAt_float4(gIn, x, yNext) * gCoeffs[1];
    const float4 w2 = rsGetElementAt_float4(gIn, xPrev, yNext) * gCoeffs[2];
    /* Row y. */
    const float4 w3 = rsGetElementAt_float4(gIn, xNext, y) * gCoeffs[3];
    const float4 w4 = rsGetElementAt_float4(gIn, x, y) * gCoeffs[4];
    const float4 w5 = rsGetElementAt_float4(gIn, xPrev, y) * gCoeffs[5];
    /* Row y-1. */
    const float4 w6 = rsGetElementAt_float4(gIn, xNext, yPrev) * gCoeffs[6];
    const float4 w7 = rsGetElementAt_float4(gIn, x, yPrev) * gCoeffs[7];
    const float4 w8 = rsGetElementAt_float4(gIn, xPrev, yPrev) * gCoeffs[8];

    /* The parenthesization pins the floating-point summation order. */
    return ((w6 + w7) + (w8 + (w0 + w1))) + ((w2 + w3) + (w4 + w5));
}
/*
 * 3x3 weighted neighborhood sum over gIn for float3 cells.
 *
 * x, y: coordinates of the cell being produced.
 * Returns the weighted sum of the nine cells around (x, y); the result is
 * neither rounded nor clamped.
 *
 * Neighbor coordinates x+1 / y+1 are capped at gWidth-1 / gHeight-1 and
 * x-1 / y-1 are floored at 0, so border cells reuse the edge row/column.
 * gCoeffs[0..2] weight row y+1, gCoeffs[3..5] row y, gCoeffs[6..8] row y-1;
 * within each row the order is x+1, x, x-1.
 */
float3 __attribute__((kernel)) convolve_F3(uint32_t x, uint32_t y) {
    const uint32_t xNext = min((int32_t)x + 1, gWidth - 1);
    const uint32_t xPrev = max((int32_t)x - 1, 0);
    const uint32_t yNext = min((int32_t)y + 1, gHeight - 1);
    const uint32_t yPrev = max((int32_t)y - 1, 0);

    /* Row y+1. */
    const float3 w0 = rsGetElementAt_float3(gIn, xNext, yNext) * gCoeffs[0];
    const float3 w1 = rsGetElementAt_float3(gIn, x, yNext) * gCoeffs[1];
    const float3 w2 = rsGetElementAt_float3(gIn, xPrev, yNext) * gCoeffs[2];
    /* Row y. */
    const float3 w3 = rsGetElementAt_float3(gIn, xNext, y) * gCoeffs[3];
    const float3 w4 = rsGetElementAt_float3(gIn, x, y) * gCoeffs[4];
    const float3 w5 = rsGetElementAt_float3(gIn, xPrev, y) * gCoeffs[5];
    /* Row y-1. */
    const float3 w6 = rsGetElementAt_float3(gIn, xNext, yPrev) * gCoeffs[6];
    const float3 w7 = rsGetElementAt_float3(gIn, x, yPrev) * gCoeffs[7];
    const float3 w8 = rsGetElementAt_float3(gIn, xPrev, yPrev) * gCoeffs[8];

    /* The parenthesization pins the floating-point summation order. */
    return ((w6 + w7) + (w8 + (w0 + w1))) + ((w2 + w3) + (w4 + w5));
}
/*
 * 3x3 weighted neighborhood sum over gIn for float2 cells.
 *
 * x, y: coordinates of the cell being produced.
 * Returns the weighted sum of the nine cells around (x, y); the result is
 * neither rounded nor clamped.
 *
 * Neighbor coordinates x+1 / y+1 are capped at gWidth-1 / gHeight-1 and
 * x-1 / y-1 are floored at 0, so border cells reuse the edge row/column.
 * gCoeffs[0..2] weight row y+1, gCoeffs[3..5] row y, gCoeffs[6..8] row y-1;
 * within each row the order is x+1, x, x-1.
 */
float2 __attribute__((kernel)) convolve_F2(uint32_t x, uint32_t y) {
    const uint32_t xNext = min((int32_t)x + 1, gWidth - 1);
    const uint32_t xPrev = max((int32_t)x - 1, 0);
    const uint32_t yNext = min((int32_t)y + 1, gHeight - 1);
    const uint32_t yPrev = max((int32_t)y - 1, 0);

    /* Row y+1. */
    const float2 w0 = rsGetElementAt_float2(gIn, xNext, yNext) * gCoeffs[0];
    const float2 w1 = rsGetElementAt_float2(gIn, x, yNext) * gCoeffs[1];
    const float2 w2 = rsGetElementAt_float2(gIn, xPrev, yNext) * gCoeffs[2];
    /* Row y. */
    const float2 w3 = rsGetElementAt_float2(gIn, xNext, y) * gCoeffs[3];
    const float2 w4 = rsGetElementAt_float2(gIn, x, y) * gCoeffs[4];
    const float2 w5 = rsGetElementAt_float2(gIn, xPrev, y) * gCoeffs[5];
    /* Row y-1. */
    const float2 w6 = rsGetElementAt_float2(gIn, xNext, yPrev) * gCoeffs[6];
    const float2 w7 = rsGetElementAt_float2(gIn, x, yPrev) * gCoeffs[7];
    const float2 w8 = rsGetElementAt_float2(gIn, xPrev, yPrev) * gCoeffs[8];

    /* The parenthesization pins the floating-point summation order. */
    return ((w6 + w7) + (w8 + (w0 + w1))) + ((w2 + w3) + (w4 + w5));
}
/*
 * 3x3 weighted neighborhood sum over gIn for single-channel float cells.
 *
 * x, y: coordinates of the cell being produced.
 * Returns the weighted sum of the nine cells around (x, y); the result is
 * neither rounded nor clamped.
 *
 * Neighbor coordinates x+1 / y+1 are capped at gWidth-1 / gHeight-1 and
 * x-1 / y-1 are floored at 0, so border cells reuse the edge row/column.
 * gCoeffs[0..2] weight row y+1, gCoeffs[3..5] row y, gCoeffs[6..8] row y-1;
 * within each row the order is x+1, x, x-1.
 */
float __attribute__((kernel)) convolve_F1(uint32_t x, uint32_t y) {
    const uint32_t xNext = min((int32_t)x + 1, gWidth - 1);
    const uint32_t xPrev = max((int32_t)x - 1, 0);
    const uint32_t yNext = min((int32_t)y + 1, gHeight - 1);
    const uint32_t yPrev = max((int32_t)y - 1, 0);

    /* Row y+1. */
    const float w0 = rsGetElementAt_float(gIn, xNext, yNext) * gCoeffs[0];
    const float w1 = rsGetElementAt_float(gIn, x, yNext) * gCoeffs[1];
    const float w2 = rsGetElementAt_float(gIn, xPrev, yNext) * gCoeffs[2];
    /* Row y. */
    const float w3 = rsGetElementAt_float(gIn, xNext, y) * gCoeffs[3];
    const float w4 = rsGetElementAt_float(gIn, x, y) * gCoeffs[4];
    const float w5 = rsGetElementAt_float(gIn, xPrev, y) * gCoeffs[5];
    /* Row y-1. */
    const float w6 = rsGetElementAt_float(gIn, xNext, yPrev) * gCoeffs[6];
    const float w7 = rsGetElementAt_float(gIn, x, yPrev) * gCoeffs[7];
    const float w8 = rsGetElementAt_float(gIn, xPrev, yPrev) * gCoeffs[8];

    /* The parenthesization pins the floating-point summation order. */
    return ((w6 + w7) + (w8 + (w0 + w1))) + ((w2 + w3) + (w4 + w5));
}