blob: 1c9f6df831fef88222710dccbf35375dcacaa7dc [file] [log] [blame]
/*
* Copyright (c) 1997, 2003, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation. Oracle designates this
* particular file as subject to the "Classpath" exception as provided
* by Oracle in the LICENSE file that accompanied this code.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*/
/*
* FUNCTION
* mlib_ImageAffine_u8_1ch_bl
* mlib_ImageAffine_u8_2ch_bl
* mlib_ImageAffine_u8_3ch_bl
* mlib_ImageAffine_u8_4ch_bl
* - image affine transformation with Bilinear filtering
* SYNOPSIS
* mlib_status mlib_ImageAffine_u8_?ch_bl(mlib_affine_param *param)
*
* NOTE: the functions in this file take a single mlib_affine_param
* pointer. The names listed under ARGUMENTS below (leftEdges,
* rightEdges, xStarts, yStarts, sides, dstData, lineAddr,
* dstYStride, is_affine, srcYStride) are not separate parameters.
*
* ARGUMENTS
* leftEdges array[dstHeight] of xLeft coordinates
* rightEdges array[dstHeight] of xRight coordinates
* xStarts array[dstHeight] of xStart * 65536 coordinates
* yStarts array[dstHeight] of yStart * 65536 coordinates
* sides output array[4]. sides[0] is yStart, sides[1] is yFinish,
* sides[2] is dx * 65536, sides[3] is dy * 65536
* dstData pointer to the first pixel on (yStart - 1) line
* lineAddr array[srcHeight] of pointers to the first pixel on
* the corresponding lines
* dstYStride stride of destination image
* is_affine indicator (Affine - GridWarp)
* srcYStride stride of source image
*
* DESCRIPTION
* The functions step along the lines from xLeft to xRight and apply
* the bilinear filtering.
*
*/
#include "mlib_ImageAffine.h"
/***************************************************************/
/* Pixel sample type used for the source and destination pointers in this file. */
#define DTYPE mlib_u8
/* Floating-point type used for the interpolation weights and intermediate
 * results in the SPARC (floating-point) code path. */
#define FTYPE mlib_f32
/***************************************************************/
/* Floating-point type for the loaded source samples (a00_*, a01_*, a10_*,
 * a11_*) in the SPARC code path; currently the same type as FTYPE. */
#define TTYPE mlib_f32
/* Converts a sample value to floating point by indexing the mlib_U82F32
 * table, which is declared outside this file (presumably a u8 -> f32
 * lookup table - confirm against its definition). */
#define I2F(x) mlib_U82F32[x]
/* Adds 0.5f; the SPARC COUNT macro applies this to the final value so that
 * the later truncating cast to DTYPE rounds to nearest. */
#define ROUND(x) ((x) + 0.5f)
/* Pastes the channel token (1ch, 2ch, 3ch, 4ch) into the function name,
 * e.g. FUN_NAME(1ch) -> mlib_ImageAffine_u8_1ch_bl. */
#define FUN_NAME(CHAN) mlib_ImageAffine_u8_##CHAN##_bl
/***************************************************************/
#ifdef __sparc /* for SPARC, using floating-point multiplies is faster */
/***************************************************************/
/*
 * GET_POINTERS(ind) - floating-point variant.
 * ind is the number of interleaved channels per pixel (callers pass 1..4).
 * Using names that must already be in the caller's scope (X, Y, dX, dY,
 * scale, lineAddr, srcYStride, xSrc, ySrc, srcPixelPtr, srcPixelPtr2,
 * fdx, fdy), it:
 *   - sets fdx/fdy to the low bits of X/Y (selected by MLIB_MASK) times scale;
 *   - derives the source row index via MLIB_POINTER_SHIFT(Y) and the source
 *     column as X >> MLIB_SHIFT;
 *   - advances X and Y by dX and dY for the next destination pixel;
 *   - points srcPixelPtr at column xSrc of the selected source row and
 *     srcPixelPtr2 at the same column srcYStride bytes further on.
 * The expansion ends without a semicolon; the caller supplies it.
 */
#define GET_POINTERS(ind) \
fdx = (FTYPE)(X & MLIB_MASK) * scale; \
fdy = (FTYPE)(Y & MLIB_MASK) * scale; \
ySrc = MLIB_POINTER_SHIFT(Y); Y += dY; \
xSrc = X >> MLIB_SHIFT; X += dX; \
srcPixelPtr = MLIB_POINTER_GET(lineAddr, ySrc) + ind * xSrc; \
srcPixelPtr2 = (DTYPE *)((mlib_u8 *)srcPixelPtr + srcYStride)
/***************************************************************/
/*
 * COUNT(ind) - bilinear blend for channel ind, floating-point variant.
 * Interpolates between the two rows with weight fdy (a00 -> a10 and
 * a01 -> a11), then between those two results with weight fdx, and stores
 * the ROUND()ed value in res<ind>. Reads the a??_<ind> samples set by LOAD.
 */
#define COUNT(ind) \
pix0_##ind = a00_##ind + fdy * (a10_##ind - a00_##ind); \
pix1_##ind = a01_##ind + fdy * (a11_##ind - a01_##ind); \
res##ind = ROUND(pix0_##ind + fdx * (pix1_##ind - pix0_##ind))
/***************************************************************/
/*
 * LOAD(ind, ind1, ind2) - fetch the 2x2 neighbourhood for channel ind.
 * ind1 and ind2 are element offsets from srcPixelPtr/srcPixelPtr2; callers
 * pass ind2 = ind1 + channel count, i.e. the same channel of the next pixel.
 * a00/a01 come from the row at srcPixelPtr, a10/a11 from the row at
 * srcPixelPtr2; each sample is converted to floating point with I2F.
 */
#define LOAD(ind, ind1, ind2) \
a00_##ind = I2F(srcPixelPtr[ind1]); \
a01_##ind = I2F(srcPixelPtr[ind2]); \
a10_##ind = I2F(srcPixelPtr2[ind1]); \
a11_##ind = I2F(srcPixelPtr2[ind2])
/***************************************************************/
/*
 * 1-channel mlib_u8 bilinear affine kernel (floating-point variant).
 *
 * Iterates destination rows j = yStart..yFinish. DECLAREVAR_BL() and CLIP(1)
 * are defined outside this file; the code relies on them to provide
 * dstData, xRight, X, Y and dstPixelPtr for the current row (TODO confirm
 * against mlib_ImageAffine.h). Always returns MLIB_SUCCESS.
 */
mlib_status FUN_NAME(1ch)(mlib_affine_param *param)
{
  DECLAREVAR_BL();
  DTYPE *srcPixelPtr2;
  DTYPE *rowLastPixel;
  const FTYPE scale = (FTYPE) 1.0 / MLIB_PREC;

  for (j = yStart; j <= yFinish; j++) {
    FTYPE fdx;
    FTYPE fdy;
    TTYPE a00_0, a01_0;
    TTYPE a10_0, a11_0;
    FTYPE pix0_0, pix1_0;
    FTYPE res0;

    CLIP(1);
    /* address of the last destination pixel written on this row */
    rowLastPixel = (DTYPE *) dstData + xRight;

    /* prime the pipeline: fetch the samples for the first pixel */
    GET_POINTERS(1);
    LOAD(0, 0, 1);

#ifdef __SUNPRO_C
#pragma pipeloop(0)
#endif /* __SUNPRO_C */
    for (; dstPixelPtr < rowLastPixel; dstPixelPtr += 1) {
      /* blend the current pixel, then fetch the next one before storing */
      COUNT(0);
      GET_POINTERS(1);
      LOAD(0, 0, 1);
      *dstPixelPtr = (DTYPE) res0;
    }

    /* epilogue: the last pixel's samples are already loaded */
    COUNT(0);
    *dstPixelPtr = (DTYPE) res0;
  }

  return MLIB_SUCCESS;
}
/***************************************************************/
/*
 * 2-channel mlib_u8 bilinear affine kernel (floating-point variant).
 *
 * Iterates destination rows j = yStart..yFinish. DECLAREVAR_BL() and CLIP(2)
 * are defined outside this file; the code relies on them to provide
 * dstData, xRight, X, Y and dstPixelPtr for the current row (TODO confirm
 * against mlib_ImageAffine.h). Always returns MLIB_SUCCESS.
 */
mlib_status FUN_NAME(2ch)(mlib_affine_param *param)
{
  DECLAREVAR_BL();
  DTYPE *srcPixelPtr2;
  DTYPE *rowLastPixel;
  const FTYPE scale = (FTYPE) 1.0 / MLIB_PREC;

  for (j = yStart; j <= yFinish; j++) {
    FTYPE fdx;
    FTYPE fdy;
    /* channel 0 */
    TTYPE a00_0, a01_0, a10_0, a11_0;
    FTYPE pix0_0, pix1_0, res0;
    /* channel 1 */
    TTYPE a00_1, a01_1, a10_1, a11_1;
    FTYPE pix0_1, pix1_1, res1;

    CLIP(2);
    /* address of the last destination pixel (2 samples) written on this row */
    rowLastPixel = (DTYPE *) dstData + 2 * xRight;

    /* prime the pipeline: LOAD(c, c, c + 2) reads channel c of the pixel
     * and of its right-hand neighbour */
    GET_POINTERS(2);
    LOAD(0, 0, 2);
    LOAD(1, 1, 3);

#ifdef __SUNPRO_C
#pragma pipeloop(0)
#endif /* __SUNPRO_C */
    for (; dstPixelPtr < rowLastPixel; dstPixelPtr += 2) {
      /* blend the current pixel, then fetch the next one before storing */
      COUNT(0);
      COUNT(1);
      GET_POINTERS(2);
      LOAD(0, 0, 2);
      LOAD(1, 1, 3);
      dstPixelPtr[0] = (DTYPE) res0;
      dstPixelPtr[1] = (DTYPE) res1;
    }

    /* epilogue: the last pixel's samples are already loaded */
    COUNT(0);
    COUNT(1);
    dstPixelPtr[0] = (DTYPE) res0;
    dstPixelPtr[1] = (DTYPE) res1;
  }

  return MLIB_SUCCESS;
}
/***************************************************************/
/*
 * 3-channel mlib_u8 bilinear affine kernel (floating-point variant).
 *
 * Iterates destination rows j = yStart..yFinish. DECLAREVAR_BL() and CLIP(3)
 * are defined outside this file; the code relies on them to provide
 * dstData, xRight, X, Y and dstPixelPtr for the current row (TODO confirm
 * against mlib_ImageAffine.h). Always returns MLIB_SUCCESS.
 *
 * The loaded-sample temporaries are declared with TTYPE, matching the
 * 1ch/2ch/4ch variants, so that all four kernels follow TTYPE if it is
 * ever changed independently of FTYPE.
 */
mlib_status FUN_NAME(3ch)(mlib_affine_param *param)
{
  DECLAREVAR_BL();
  DTYPE *dstLineEnd;
  DTYPE *srcPixelPtr2;
  FTYPE scale = (FTYPE) 1.0 / MLIB_PREC;

  for (j = yStart; j <= yFinish; j++) {
    FTYPE fdx, fdy;
    TTYPE a00_0, a01_0, a10_0, a11_0;
    TTYPE a00_1, a01_1, a10_1, a11_1;
    TTYPE a00_2, a01_2, a10_2, a11_2;
    FTYPE pix0_0, pix1_0, res0;
    FTYPE pix0_1, pix1_1, res1;
    FTYPE pix0_2, pix1_2, res2;

    CLIP(3);
    /* address of the last destination pixel (3 samples) written on this row */
    dstLineEnd = (DTYPE *) dstData + 3 * xRight;

    /* prime the pipeline: LOAD(c, c, c + 3) reads channel c of the pixel
     * and of its right-hand neighbour */
    GET_POINTERS(3);
    LOAD(0, 0, 3);
    LOAD(1, 1, 4);
    LOAD(2, 2, 5);

#ifdef __SUNPRO_C
#pragma pipeloop(0)
#endif /* __SUNPRO_C */
    for (; dstPixelPtr < dstLineEnd; dstPixelPtr += 3) {
      /* blend the current pixel, then fetch the next one before storing */
      COUNT(0);
      COUNT(1);
      COUNT(2);
      GET_POINTERS(3);
      LOAD(0, 0, 3);
      LOAD(1, 1, 4);
      LOAD(2, 2, 5);
      dstPixelPtr[0] = (DTYPE) res0;
      dstPixelPtr[1] = (DTYPE) res1;
      dstPixelPtr[2] = (DTYPE) res2;
    }

    /* epilogue: the last pixel's samples are already loaded */
    COUNT(0);
    COUNT(1);
    COUNT(2);
    dstPixelPtr[0] = (DTYPE) res0;
    dstPixelPtr[1] = (DTYPE) res1;
    dstPixelPtr[2] = (DTYPE) res2;
  }

  return MLIB_SUCCESS;
}
/***************************************************************/
/*
 * 4-channel mlib_u8 bilinear affine kernel (floating-point variant).
 *
 * Iterates destination rows j = yStart..yFinish. DECLAREVAR_BL() and CLIP(4)
 * are defined outside this file; the code relies on them to provide
 * dstData, xRight, X, Y and dstPixelPtr for the current row (TODO confirm
 * against mlib_ImageAffine.h). Always returns MLIB_SUCCESS.
 */
mlib_status FUN_NAME(4ch)(mlib_affine_param *param)
{
  DECLAREVAR_BL();
  DTYPE *srcPixelPtr2;
  DTYPE *rowLastPixel;
  const FTYPE scale = (FTYPE) 1.0 / MLIB_PREC;

  for (j = yStart; j <= yFinish; j++) {
    FTYPE fdx;
    FTYPE fdy;
    /* channel 0 */
    TTYPE a00_0, a01_0, a10_0, a11_0;
    FTYPE pix0_0, pix1_0, res0;
    /* channel 1 */
    TTYPE a00_1, a01_1, a10_1, a11_1;
    FTYPE pix0_1, pix1_1, res1;
    /* channel 2 */
    TTYPE a00_2, a01_2, a10_2, a11_2;
    FTYPE pix0_2, pix1_2, res2;
    /* channel 3 */
    TTYPE a00_3, a01_3, a10_3, a11_3;
    FTYPE pix0_3, pix1_3, res3;

    CLIP(4);
    /* address of the last destination pixel (4 samples) written on this row */
    rowLastPixel = (DTYPE *) dstData + 4 * xRight;

    /* prime the pipeline: LOAD(c, c, c + 4) reads channel c of the pixel
     * and of its right-hand neighbour */
    GET_POINTERS(4);
    LOAD(0, 0, 4);
    LOAD(1, 1, 5);
    LOAD(2, 2, 6);
    LOAD(3, 3, 7);

#ifdef __SUNPRO_C
#pragma pipeloop(0)
#endif /* __SUNPRO_C */
    for (; dstPixelPtr < rowLastPixel; dstPixelPtr += 4) {
      /* blend the current pixel, then fetch the next one before storing */
      COUNT(0);
      COUNT(1);
      COUNT(2);
      COUNT(3);
      GET_POINTERS(4);
      LOAD(0, 0, 4);
      LOAD(1, 1, 5);
      LOAD(2, 2, 6);
      LOAD(3, 3, 7);
      dstPixelPtr[0] = (DTYPE) res0;
      dstPixelPtr[1] = (DTYPE) res1;
      dstPixelPtr[2] = (DTYPE) res2;
      dstPixelPtr[3] = (DTYPE) res3;
    }

    /* epilogue: the last pixel's samples are already loaded */
    COUNT(0);
    COUNT(1);
    COUNT(2);
    COUNT(3);
    dstPixelPtr[0] = (DTYPE) res0;
    dstPixelPtr[1] = (DTYPE) res1;
    dstPixelPtr[2] = (DTYPE) res2;
    dstPixelPtr[3] = (DTYPE) res3;
  }

  return MLIB_SUCCESS;
}
#else /* for x86, using integer multiplies is faster */
/* for SHORT/USHORT decrease MLIB_SHIFT due to
* overflow in multiplies like fdy * (a10 - a00)
*/
/*
#undef MLIB_SHIFT
#define MLIB_SHIFT 15
*/
/* Half of (1 << MLIB_SHIFT): added before a right shift by MLIB_SHIFT so the
 * fixed-point result is rounded rather than simply shifted down. */
#define MLIB_ROUND (1 << (MLIB_SHIFT - 1))
/***************************************************************/
/*
 * GET_POINTERS(ind) - integer (fixed-point) variant.
 * ind is the number of interleaved channels per pixel (callers pass 1..4).
 * Using names that must already be in the caller's scope (X, Y, dX, dY,
 * lineAddr, srcYStride, xSrc, ySrc, srcPixelPtr, srcPixelPtr2, fdx, fdy), it:
 *   - sets fdx/fdy to the low bits of X/Y selected by MLIB_MASK (kept as
 *     integers, unlike the floating-point variant);
 *   - derives the source row index via MLIB_POINTER_SHIFT(Y) and the source
 *     column as X >> MLIB_SHIFT;
 *   - points srcPixelPtr at column xSrc of the selected source row and
 *     srcPixelPtr2 at the same column srcYStride bytes further on;
 *   - advances X and Y by dX and dY for the next destination pixel.
 * The expansion ends without a semicolon; the caller supplies it.
 */
#define GET_POINTERS(ind) \
fdx = X & MLIB_MASK; \
fdy = Y & MLIB_MASK; \
ySrc = MLIB_POINTER_SHIFT(Y); \
xSrc = X >> MLIB_SHIFT; \
srcPixelPtr = MLIB_POINTER_GET(lineAddr, ySrc) + ind * xSrc; \
srcPixelPtr2 = (DTYPE *)((mlib_u8 *)srcPixelPtr + srcYStride); \
X += dX; \
Y += dY
/***************************************************************/
/*
 * COUNT(ind) - bilinear blend for channel ind in fixed point.
 * Each step computes base + ((weight * delta + MLIB_ROUND) >> MLIB_SHIFT):
 * first between the two rows with weight fdy, then between those results
 * with weight fdx; the final value is stored in res<ind>.
 * NOTE(review): delta can be negative, so this relies on >> of a negative
 * signed value being an arithmetic shift (implementation-defined in C).
 */
#define COUNT(ind) \
pix0_##ind = a00_##ind + ((fdy * (a10_##ind - a00_##ind) + MLIB_ROUND) >> MLIB_SHIFT); \
pix1_##ind = a01_##ind + ((fdy * (a11_##ind - a01_##ind) + MLIB_ROUND) >> MLIB_SHIFT); \
res##ind = pix0_##ind + ((fdx * (pix1_##ind - pix0_##ind) + MLIB_ROUND) >> MLIB_SHIFT)
/***************************************************************/
/*
 * LOAD(ind, ind1, ind2) - fetch the 2x2 neighbourhood for channel ind.
 * ind1 and ind2 are element offsets from srcPixelPtr/srcPixelPtr2; callers
 * pass ind2 = ind1 + channel count, i.e. the same channel of the next pixel.
 * a00/a01 come from the row at srcPixelPtr, a10/a11 from the row at
 * srcPixelPtr2; samples are stored as raw integer values.
 */
#define LOAD(ind, ind1, ind2) \
a00_##ind = srcPixelPtr[ind1]; \
a01_##ind = srcPixelPtr[ind2]; \
a10_##ind = srcPixelPtr2[ind1]; \
a11_##ind = srcPixelPtr2[ind2]
/***************************************************************/
/*
 * 1-channel mlib_u8 bilinear affine kernel (integer fixed-point variant).
 *
 * Iterates destination rows j = yStart..yFinish. DECLAREVAR_BL() and CLIP(1)
 * are defined outside this file; the code relies on them to provide
 * dstData, xRight, X, Y, dX, dY and dstPixelPtr (TODO confirm against
 * mlib_ImageAffine.h). Always returns MLIB_SUCCESS.
 */
mlib_status FUN_NAME(1ch)(mlib_affine_param *param)
{
  DECLAREVAR_BL();
  DTYPE *srcPixelPtr2;
  DTYPE *rowLastPixel;

#if MLIB_SHIFT == 15
  /* compiled only when MLIB_SHIFT is 15: halve the per-pixel steps */
  dX = (dX + 1) >> 1;
  dY = (dY + 1) >> 1;
#endif /* MLIB_SHIFT == 15 */

  for (j = yStart; j <= yFinish; j++) {
    mlib_s32 fdx;
    mlib_s32 fdy;
    mlib_s32 a00_0, a01_0;
    mlib_s32 a10_0, a11_0;
    mlib_s32 pix0_0, pix1_0;
    mlib_s32 res0;

    CLIP(1);
    /* address of the last destination pixel written on this row */
    rowLastPixel = (DTYPE *) dstData + xRight;

#if MLIB_SHIFT == 15
    /* compiled only when MLIB_SHIFT is 15: halve the start coordinates */
    X = X >> 1;
    Y = Y >> 1;
#endif /* MLIB_SHIFT == 15 */

    /* prime the pipeline: fetch the samples for the first pixel */
    GET_POINTERS(1);
    LOAD(0, 0, 1);

#ifdef __SUNPRO_C
#pragma pipeloop(0)
#endif /* __SUNPRO_C */
    for (; dstPixelPtr < rowLastPixel; dstPixelPtr += 1) {
      /* blend the current pixel, then fetch the next one before storing */
      COUNT(0);
      GET_POINTERS(1);
      LOAD(0, 0, 1);
      *dstPixelPtr = (DTYPE) res0;
    }

    /* epilogue: the last pixel's samples are already loaded */
    COUNT(0);
    *dstPixelPtr = (DTYPE) res0;
  }

  return MLIB_SUCCESS;
}
/***************************************************************/
/*
 * 2-channel mlib_u8 bilinear affine kernel (integer fixed-point variant).
 *
 * Iterates destination rows j = yStart..yFinish. DECLAREVAR_BL() and CLIP(2)
 * are defined outside this file; the code relies on them to provide
 * dstData, xRight, X, Y, dX, dY and dstPixelPtr (TODO confirm against
 * mlib_ImageAffine.h). Always returns MLIB_SUCCESS.
 */
mlib_status FUN_NAME(2ch)(mlib_affine_param *param)
{
  DECLAREVAR_BL();
  DTYPE *srcPixelPtr2;
  DTYPE *rowLastPixel;

#if MLIB_SHIFT == 15
  /* compiled only when MLIB_SHIFT is 15: halve the per-pixel steps */
  dX = (dX + 1) >> 1;
  dY = (dY + 1) >> 1;
#endif /* MLIB_SHIFT == 15 */

  for (j = yStart; j <= yFinish; j++) {
    mlib_s32 fdx;
    mlib_s32 fdy;
    /* channel 0 */
    mlib_s32 a00_0, a01_0, a10_0, a11_0;
    mlib_s32 pix0_0, pix1_0, res0;
    /* channel 1 */
    mlib_s32 a00_1, a01_1, a10_1, a11_1;
    mlib_s32 pix0_1, pix1_1, res1;

    CLIP(2);
    /* address of the last destination pixel (2 samples) written on this row */
    rowLastPixel = (DTYPE *) dstData + 2 * xRight;

#if MLIB_SHIFT == 15
    /* compiled only when MLIB_SHIFT is 15: halve the start coordinates */
    X = X >> 1;
    Y = Y >> 1;
#endif /* MLIB_SHIFT == 15 */

    /* prime the pipeline: LOAD(c, c, c + 2) reads channel c of the pixel
     * and of its right-hand neighbour */
    GET_POINTERS(2);
    LOAD(0, 0, 2);
    LOAD(1, 1, 3);

#ifdef __SUNPRO_C
#pragma pipeloop(0)
#endif /* __SUNPRO_C */
    for (; dstPixelPtr < rowLastPixel; dstPixelPtr += 2) {
      /* blend the current pixel, then fetch the next one before storing */
      COUNT(0);
      COUNT(1);
      GET_POINTERS(2);
      LOAD(0, 0, 2);
      LOAD(1, 1, 3);
      dstPixelPtr[0] = (DTYPE) res0;
      dstPixelPtr[1] = (DTYPE) res1;
    }

    /* epilogue: the last pixel's samples are already loaded */
    COUNT(0);
    COUNT(1);
    dstPixelPtr[0] = (DTYPE) res0;
    dstPixelPtr[1] = (DTYPE) res1;
  }

  return MLIB_SUCCESS;
}
/***************************************************************/
/*
 * 3-channel mlib_u8 bilinear affine kernel (integer fixed-point variant).
 *
 * Iterates destination rows j = yStart..yFinish. DECLAREVAR_BL() and CLIP(3)
 * are defined outside this file; the code relies on them to provide
 * dstData, xRight, X, Y, dX, dY and dstPixelPtr (TODO confirm against
 * mlib_ImageAffine.h). Always returns MLIB_SUCCESS.
 */
mlib_status FUN_NAME(3ch)(mlib_affine_param *param)
{
  DECLAREVAR_BL();
  DTYPE *srcPixelPtr2;
  DTYPE *rowLastPixel;

#if MLIB_SHIFT == 15
  /* compiled only when MLIB_SHIFT is 15: halve the per-pixel steps */
  dX = (dX + 1) >> 1;
  dY = (dY + 1) >> 1;
#endif /* MLIB_SHIFT == 15 */

  for (j = yStart; j <= yFinish; j++) {
    mlib_s32 fdx;
    mlib_s32 fdy;
    /* channel 0 */
    mlib_s32 a00_0, a01_0, a10_0, a11_0;
    mlib_s32 pix0_0, pix1_0, res0;
    /* channel 1 */
    mlib_s32 a00_1, a01_1, a10_1, a11_1;
    mlib_s32 pix0_1, pix1_1, res1;
    /* channel 2 */
    mlib_s32 a00_2, a01_2, a10_2, a11_2;
    mlib_s32 pix0_2, pix1_2, res2;

    CLIP(3);
    /* address of the last destination pixel (3 samples) written on this row */
    rowLastPixel = (DTYPE *) dstData + 3 * xRight;

#if MLIB_SHIFT == 15
    /* compiled only when MLIB_SHIFT is 15: halve the start coordinates */
    X = X >> 1;
    Y = Y >> 1;
#endif /* MLIB_SHIFT == 15 */

    /* prime the pipeline: LOAD(c, c, c + 3) reads channel c of the pixel
     * and of its right-hand neighbour */
    GET_POINTERS(3);
    LOAD(0, 0, 3);
    LOAD(1, 1, 4);
    LOAD(2, 2, 5);

#ifdef __SUNPRO_C
#pragma pipeloop(0)
#endif /* __SUNPRO_C */
    for (; dstPixelPtr < rowLastPixel; dstPixelPtr += 3) {
      /* blend the current pixel, then fetch the next one before storing */
      COUNT(0);
      COUNT(1);
      COUNT(2);
      GET_POINTERS(3);
      LOAD(0, 0, 3);
      LOAD(1, 1, 4);
      LOAD(2, 2, 5);
      dstPixelPtr[0] = (DTYPE) res0;
      dstPixelPtr[1] = (DTYPE) res1;
      dstPixelPtr[2] = (DTYPE) res2;
    }

    /* epilogue: the last pixel's samples are already loaded */
    COUNT(0);
    COUNT(1);
    COUNT(2);
    dstPixelPtr[0] = (DTYPE) res0;
    dstPixelPtr[1] = (DTYPE) res1;
    dstPixelPtr[2] = (DTYPE) res2;
  }

  return MLIB_SUCCESS;
}
/***************************************************************/
/*
 * 4-channel mlib_u8 bilinear affine kernel (integer fixed-point variant).
 *
 * Iterates destination rows j = yStart..yFinish. DECLAREVAR_BL() and CLIP(4)
 * are defined outside this file; the code relies on them to provide
 * dstData, xRight, X, Y, dX, dY and dstPixelPtr (TODO confirm against
 * mlib_ImageAffine.h). Always returns MLIB_SUCCESS.
 */
mlib_status FUN_NAME(4ch)(mlib_affine_param *param)
{
  DECLAREVAR_BL();
  DTYPE *srcPixelPtr2;
  DTYPE *rowLastPixel;

#if MLIB_SHIFT == 15
  /* compiled only when MLIB_SHIFT is 15: halve the per-pixel steps */
  dX = (dX + 1) >> 1;
  dY = (dY + 1) >> 1;
#endif /* MLIB_SHIFT == 15 */

  for (j = yStart; j <= yFinish; j++) {
    mlib_s32 fdx;
    mlib_s32 fdy;
    /* channel 0 */
    mlib_s32 a00_0, a01_0, a10_0, a11_0;
    mlib_s32 pix0_0, pix1_0, res0;
    /* channel 1 */
    mlib_s32 a00_1, a01_1, a10_1, a11_1;
    mlib_s32 pix0_1, pix1_1, res1;
    /* channel 2 */
    mlib_s32 a00_2, a01_2, a10_2, a11_2;
    mlib_s32 pix0_2, pix1_2, res2;
    /* channel 3 */
    mlib_s32 a00_3, a01_3, a10_3, a11_3;
    mlib_s32 pix0_3, pix1_3, res3;

    CLIP(4);
    /* address of the last destination pixel (4 samples) written on this row */
    rowLastPixel = (DTYPE *) dstData + 4 * xRight;

#if MLIB_SHIFT == 15
    /* compiled only when MLIB_SHIFT is 15: halve the start coordinates */
    X = X >> 1;
    Y = Y >> 1;
#endif /* MLIB_SHIFT == 15 */

    /* prime the pipeline: LOAD(c, c, c + 4) reads channel c of the pixel
     * and of its right-hand neighbour */
    GET_POINTERS(4);
    LOAD(0, 0, 4);
    LOAD(1, 1, 5);
    LOAD(2, 2, 6);
    LOAD(3, 3, 7);

#ifdef __SUNPRO_C
#pragma pipeloop(0)
#endif /* __SUNPRO_C */
    for (; dstPixelPtr < rowLastPixel; dstPixelPtr += 4) {
      /* blend the current pixel, then fetch the next one before storing */
      COUNT(0);
      COUNT(1);
      COUNT(2);
      COUNT(3);
      GET_POINTERS(4);
      LOAD(0, 0, 4);
      LOAD(1, 1, 5);
      LOAD(2, 2, 6);
      LOAD(3, 3, 7);
      dstPixelPtr[0] = (DTYPE) res0;
      dstPixelPtr[1] = (DTYPE) res1;
      dstPixelPtr[2] = (DTYPE) res2;
      dstPixelPtr[3] = (DTYPE) res3;
    }

    /* epilogue: the last pixel's samples are already loaded */
    COUNT(0);
    COUNT(1);
    COUNT(2);
    COUNT(3);
    dstPixelPtr[0] = (DTYPE) res0;
    dstPixelPtr[1] = (DTYPE) res1;
    dstPixelPtr[2] = (DTYPE) res2;
    dstPixelPtr[3] = (DTYPE) res3;
  }

  return MLIB_SUCCESS;
}
#endif /* __sparc ( for SPARC, using floating-point multiplies is faster ) */
/***************************************************************/