blob: 67967ed458c4ca1581238b367b8bc4bd1bb81a3b [file] [log] [blame]
/*
* Copyright (c) 2003, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation. Oracle designates this
* particular file as subject to the "Classpath" exception as provided
* by Oracle in the LICENSE file that accompanied this code.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*/
#if !defined(JAVA2D_NO_MLIB) || defined(MLIB_ADD_SUFF)
#include "vis_AlphaMacros.h"
/***************************************************************/
/* ##############################################################
* IntArgbToIntArgbAlphaMaskBlit()
* IntArgbToFourByteAbgrAlphaMaskBlit()
*/
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcA, srcARGB) \
{ \
mlib_s32 srcF, dstF; \
\
srcA = mul8_extra[srcA]; \
\
srcF = ((dstA & SrcOpAnd) ^ SrcOpXor) + SrcOpAdd; \
dstF = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd; \
\
srcF = MUL8_INT(pathA, srcF); \
dstF = MUL8_INT(pathA, dstF) + (0xff - pathA); \
\
srcA = MUL8_INT(srcF, srcA); \
dstA = MUL8_INT(dstF, dstA); \
\
BLEND_VIS(rr, dstARGB, srcARGB, dstA, srcA); \
}
/***************************************************************/
static void IntArgbToIntArgbAlphaMaskBlit_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA0, pathA1, dstA0, dstA1, srcA0, srcA1, msk;
mlib_d64 res0, res1, dstARGB;
mlib_f32 dstARGB0, srcARGB0, srcARGB1;
mlib_s32 SrcOpAnd = log_val[0];
mlib_s32 SrcOpXor = log_val[1];
mlib_s32 SrcOpAdd = log_val[2];
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
i = i0 = 0;
if ((mlib_s32)dst_ptr & 7) {
pathA0 = pMask[i];
if (pathA0) {
dstA0 = *(mlib_u8*)(dst_ptr + i);
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
dst_ptr[i] = vis_fpack16(res0);
*(mlib_u8*)(dst_ptr + i) = dstA0;
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
pathA0 = pMask[i];
pathA1 = pMask[i + 1];
dstA0 = *(mlib_u8*)(dst_ptr + i);
dstA1 = *(mlib_u8*)(dst_ptr + i + 1);
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcA0 = *(mlib_u8*)(src_ptr + i);
srcA1 = *(mlib_u8*)(src_ptr + i + 1);
srcARGB0 = src_ptr[i];
srcARGB1 = src_ptr[i + 1];
MASK_FILL(res0, pathA0, dstA0, vis_read_hi(dstARGB), srcA0, srcARGB0);
MASK_FILL(res1, pathA1, dstA1, vis_read_lo(dstARGB), srcA1, srcARGB1);
res0 = vis_fpack16_pair(res0, res1);
msk = (((-pathA0) & (1 << 11)) | ((-pathA1) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
*(mlib_u8*)(dst_ptr + i ) = dstA0;
*(mlib_u8*)(dst_ptr + i + 1) = dstA1;
}
if (i < width) {
pathA0 = pMask[i];
if (pathA0) {
dstA0 = *(mlib_u8*)(dst_ptr + i);
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
dst_ptr[i] = vis_fpack16(res0);
*(mlib_u8*)(dst_ptr + i) = dstA0;
}
}
}
/***************************************************************/
#undef MASK_FILL
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcA, srcARGB) \
{ \
mlib_s32 srcF, dstF; \
\
srcA = mul8_extra[srcA]; \
\
srcF = ((dstA & SrcOpAnd) ^ SrcOpXor) + SrcOpAdd; \
dstF = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd; \
\
srcA = MUL8_INT(srcF, srcA); \
dstA = MUL8_INT(dstF, dstA); \
\
BLEND_VIS(rr, dstARGB, srcARGB, dstA, srcA); \
}
/***************************************************************/
static void IntArgbToIntArgbAlphaMaskBlit_A1_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_tbl)
{
mlib_s32 i;
mlib_s32 dstA0, srcA0;
mlib_d64 res0;
mlib_f32 dstARGB0, srcARGB0;
mlib_s32 SrcOpAnd = log_val[0];
mlib_s32 SrcOpXor = log_val[1];
mlib_s32 SrcOpAdd = log_val[2];
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
#pragma pipeloop(0)
for (i = 0; i < width; i++) {
dstA0 = *(mlib_u8*)(dst_ptr + i);
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
dst_ptr[i] = vis_fpack16(res0);
*(mlib_u8*)(dst_ptr + i) = dstA0;
}
}
/***************************************************************/
void ADD_SUFF(IntArgbToIntArgbAlphaMaskBlit)(MASKBLIT_PARAMS)
{
mlib_s32 extraA;
mlib_s32 dstScan = pDstInfo->scanStride;
mlib_s32 srcScan = pSrcInfo->scanStride;
mlib_s32 log_val[6];
mlib_s32 j;
mlib_s32 SrcOpAnd;
mlib_s32 SrcOpXor;
mlib_s32 SrcOpAdd;
mlib_s32 DstOpAnd;
mlib_s32 DstOpXor;
mlib_s32 DstOpAdd;
mlib_u8 *mul8_extra;
extraA = (mlib_s32)(pCompInfo->details.extraAlpha * 255.0 + 0.5);
mul8_extra = mul8table[extraA];
SrcOpAnd = (AlphaRules[pCompInfo->rule].srcOps).andval;
SrcOpXor = (AlphaRules[pCompInfo->rule].srcOps).xorval;
SrcOpAdd = (AlphaRules[pCompInfo->rule].srcOps).addval;
SrcOpAdd -= SrcOpXor;
DstOpAnd = (AlphaRules[pCompInfo->rule].dstOps).andval;
DstOpXor = (AlphaRules[pCompInfo->rule].dstOps).xorval;
DstOpAdd = (AlphaRules[pCompInfo->rule].dstOps).addval;
DstOpAdd -= DstOpXor;
log_val[0] = SrcOpAnd;
log_val[1] = SrcOpXor;
log_val[2] = SrcOpAdd;
log_val[3] = DstOpAnd;
log_val[4] = DstOpXor;
log_val[5] = DstOpAdd;
vis_write_gsr(7 << 3);
if (pMask != NULL) {
pMask += maskOff;
if (dstScan == 4*width && srcScan == dstScan && maskScan == width) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntArgbToIntArgbAlphaMaskBlit_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
(void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
PTR_ADD(pMask, maskScan);
}
} else {
if (dstScan == 4*width && srcScan == dstScan) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntArgbToIntArgbAlphaMaskBlit_A1_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
(void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
}
}
}
/***************************************************************/
void ADD_SUFF(IntArgbToFourByteAbgrAlphaMaskBlit)(MASKBLIT_PARAMS)
{
mlib_d64 buff[BUFF_SIZE/2];
void *src_buff = buff, *dst_buff;
mlib_s32 extraA;
mlib_s32 dstScan = pDstInfo->scanStride;
mlib_s32 srcScan = pSrcInfo->scanStride;
mlib_s32 log_val[6];
mlib_s32 j;
mlib_s32 SrcOpAnd;
mlib_s32 SrcOpXor;
mlib_s32 SrcOpAdd;
mlib_s32 DstOpAnd;
mlib_s32 DstOpXor;
mlib_s32 DstOpAdd;
mlib_u8 *mul8_extra;
extraA = (mlib_s32)(pCompInfo->details.extraAlpha * 255.0 + 0.5);
mul8_extra = mul8table[extraA];
SrcOpAnd = (AlphaRules[pCompInfo->rule].srcOps).andval;
SrcOpXor = (AlphaRules[pCompInfo->rule].srcOps).xorval;
SrcOpAdd = (AlphaRules[pCompInfo->rule].srcOps).addval;
SrcOpAdd -= SrcOpXor;
DstOpAnd = (AlphaRules[pCompInfo->rule].dstOps).andval;
DstOpXor = (AlphaRules[pCompInfo->rule].dstOps).xorval;
DstOpAdd = (AlphaRules[pCompInfo->rule].dstOps).addval;
DstOpAdd -= DstOpXor;
log_val[0] = SrcOpAnd;
log_val[1] = SrcOpXor;
log_val[2] = SrcOpAdd;
log_val[3] = DstOpAnd;
log_val[4] = DstOpXor;
log_val[5] = DstOpAdd;
vis_write_gsr(7 << 3);
if (2*width > BUFF_SIZE) src_buff = mlib_malloc(2*width*sizeof(mlib_s32));
dst_buff = (mlib_s32*)src_buff + width;
if (pMask != NULL) {
pMask += maskOff;
for (j = 0; j < height; j++) {
IntArgbToIntAbgrConvert_line(srcBase, src_buff, width);
if (!((mlib_s32)dstBase & 3)) {
IntArgbToIntArgbAlphaMaskBlit_line(dstBase, src_buff, pMask,
width, log_val, mul8_extra,
(void*)mul8table);
} else {
mlib_ImageCopy_na(dstBase, dst_buff, width*sizeof(mlib_s32));
IntArgbToIntArgbAlphaMaskBlit_line(dst_buff, src_buff, pMask,
width, log_val, mul8_extra,
(void*)mul8table);
mlib_ImageCopy_na(dst_buff, dstBase, width*sizeof(mlib_s32));
}
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
PTR_ADD(pMask, maskScan);
}
} else {
for (j = 0; j < height; j++) {
IntArgbToIntAbgrConvert_line(srcBase, src_buff, width);
if (!((mlib_s32)dstBase & 3)) {
IntArgbToIntArgbAlphaMaskBlit_A1_line(dstBase, src_buff,
pMask, width, log_val,
mul8_extra,
(void*)mul8table);
} else {
mlib_ImageCopy_na(dstBase, dst_buff, width*sizeof(mlib_s32));
IntArgbToIntArgbAlphaMaskBlit_A1_line(dst_buff, src_buff,
pMask, width, log_val,
mul8_extra,
(void*)mul8table);
mlib_ImageCopy_na(dst_buff, dstBase, width*sizeof(mlib_s32));
}
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
}
}
if (src_buff != buff) {
mlib_free(src_buff);
}
}
/***************************************************************/
/* ##############################################################
* IntArgbToIntRgbAlphaMaskBlit()
*/
#undef MASK_FILL
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcA, srcARGB) \
{ \
mlib_s32 srcF, dstF; \
\
srcA = mul8_extra[srcA]; \
dstF = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd; \
\
srcF = mul8_srcF[pathA]; \
dstA = MUL8_INT(dstF, pathA) + (0xff - pathA); \
\
pathA = dstA - 0xff - srcF; \
/* (pathA == 0) if (dstA == 0xFF && srcF == 0) */ \
\
srcA = MUL8_INT(srcA, srcF); \
\
BLEND_VIS_RGB(rr, dstARGB, srcARGB, dstA, srcA); \
}
/***************************************************************/
static void IntArgbToIntRgbAlphaMaskBlit_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_srcF,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA0, pathA1, dstA0, dstA1, srcA0, srcA1, msk;
mlib_d64 res0, res1, dstARGB;
mlib_f32 dstARGB0, srcARGB0, srcARGB1;
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
i = i0 = 0;
if ((mlib_s32)dst_ptr & 7) {
pathA0 = pMask[i];
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
pathA0 = pMask[i];
pathA1 = pMask[i + 1];
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcA0 = *(mlib_u8*)(src_ptr + i);
srcA1 = *(mlib_u8*)(src_ptr + i + 1);
srcARGB0 = src_ptr[i];
srcARGB1 = src_ptr[i + 1];
MASK_FILL(res0, pathA0, dstA0, vis_read_hi(dstARGB), srcA0, srcARGB0);
MASK_FILL(res1, pathA1, dstA1, vis_read_lo(dstARGB), srcA1, srcARGB1);
res0 = vis_fpack16_pair(res0, res1);
msk = (((pathA0) & (1 << 11)) | ((pathA1) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
}
if (i < width) {
pathA0 = pMask[i];
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
}
}
/***************************************************************/
#undef MASK_FILL
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcA, srcARGB) \
{ \
srcA = mul8_extra[srcA]; \
dstA = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd; \
\
srcA = mul8_srcF[srcA]; \
\
pathA = dstA - srcF_255; \
/* (pathA == 0) if (dstA == 0xFF && srcF == 0) */ \
\
BLEND_VIS_RGB(rr, dstARGB, srcARGB, dstA, srcA); \
}
/***************************************************************/
static void IntArgbToIntRgbAlphaMaskBlit_A1_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_srcF,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA0, pathA1, dstA0, dstA1, srcA0, srcA1, msk;
mlib_d64 res0, res1, dstARGB;
mlib_f32 dstARGB0, srcARGB0, srcARGB1;
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF_255 = mul8_srcF[0xff] + 0xff;
i = i0 = 0;
if ((mlib_s32)dst_ptr & 7) {
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcA0 = *(mlib_u8*)(src_ptr + i);
srcA1 = *(mlib_u8*)(src_ptr + i + 1);
srcARGB0 = src_ptr[i];
srcARGB1 = src_ptr[i + 1];
MASK_FILL(res0, pathA0, dstA0, vis_read_hi(dstARGB), srcA0, srcARGB0);
MASK_FILL(res1, pathA1, dstA1, vis_read_lo(dstARGB), srcA1, srcARGB1);
res0 = vis_fpack16_pair(res0, res1);
msk = (((pathA0) & (1 << 11)) | ((pathA1) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
}
if (i < width) {
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
}
}
/***************************************************************/
void ADD_SUFF(IntArgbToIntRgbAlphaMaskBlit)(MASKBLIT_PARAMS)
{
mlib_s32 extraA, srcF;
mlib_s32 dstScan = pDstInfo->scanStride;
mlib_s32 srcScan = pSrcInfo->scanStride;
mlib_s32 log_val[6];
mlib_s32 j;
mlib_s32 SrcOpAnd;
mlib_s32 SrcOpXor;
mlib_s32 SrcOpAdd;
mlib_s32 DstOpAnd;
mlib_s32 DstOpXor;
mlib_s32 DstOpAdd;
mlib_u8 *mul8_extra, *mul8_srcF;
extraA = (mlib_s32)(pCompInfo->details.extraAlpha * 255.0 + 0.5);
mul8_extra = mul8table[extraA];
SrcOpAnd = (AlphaRules[pCompInfo->rule].srcOps).andval;
SrcOpXor = (AlphaRules[pCompInfo->rule].srcOps).xorval;
SrcOpAdd = (AlphaRules[pCompInfo->rule].srcOps).addval;
SrcOpAdd -= SrcOpXor;
DstOpAnd = (AlphaRules[pCompInfo->rule].dstOps).andval;
DstOpXor = (AlphaRules[pCompInfo->rule].dstOps).xorval;
DstOpAdd = (AlphaRules[pCompInfo->rule].dstOps).addval;
DstOpAdd -= DstOpXor;
log_val[3] = DstOpAnd;
log_val[4] = DstOpXor;
log_val[5] = DstOpAdd;
srcF = ((0xff & SrcOpAnd) ^ SrcOpXor) + SrcOpAdd;
mul8_srcF = mul8table[srcF];
vis_write_gsr(7 << 3);
if (pMask != NULL) {
pMask += maskOff;
if (dstScan == 4*width && srcScan == dstScan && maskScan == width) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntArgbToIntRgbAlphaMaskBlit_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
mul8_srcF, (void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
PTR_ADD(pMask, maskScan);
}
} else {
if (dstScan == 4*width && srcScan == dstScan) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntArgbToIntRgbAlphaMaskBlit_A1_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
mul8_srcF, (void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
}
}
}
/***************************************************************/
/* ##############################################################
* IntRgbToIntArgbAlphaMaskBlit()
*/
#undef MASK_FILL
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcAX, srcARGB) \
{ \
mlib_s32 pathAx256 = pathA << 8; \
srcF = ((dstA & SrcOpAnd) ^ SrcOpXor) + SrcOpAdd; \
\
srcF = mul8_tbl[pathAx256 + srcF]; \
dstFX = mul8_tbl[pathAx256 + dstF] + (0xff - pathA); \
\
srcAX = mul8_tbl[srcF + srcAx256]; \
dstA = mul8_tbl[dstFX + (dstA << 8)]; \
\
BLEND_VIS(rr, dstARGB, srcARGB, dstA, srcAX); \
}
/***************************************************************/
static void IntRgbToIntArgbAlphaMaskBlit_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA0, pathA1, dstA0, dstA1, srcA, srcA0, srcA1, msk;
mlib_d64 res0, res1, dstARGB;
mlib_f32 dstARGB0, srcARGB0, srcARGB1;
mlib_s32 SrcOpAnd = log_val[0];
mlib_s32 SrcOpXor = log_val[1];
mlib_s32 SrcOpAdd = log_val[2];
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF, dstF, dstFX, srcAx256;
i = i0 = 0;
srcA = 0xFF;
srcA = mul8_extra[srcA];
srcAx256 = srcA << 8;
dstF = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd;
if ((mlib_s32)dst_ptr & 7) {
pathA0 = pMask[i];
if (pathA0) {
dstA0 = *(mlib_u8*)(dst_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
dst_ptr[i] = vis_fpack16(res0);
*(mlib_u8*)(dst_ptr + i) = dstA0;
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
pathA0 = pMask[i];
pathA1 = pMask[i + 1];
dstA0 = *(mlib_u8*)(dst_ptr + i);
dstA1 = *(mlib_u8*)(dst_ptr + i + 1);
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcARGB0 = src_ptr[i];
srcARGB1 = src_ptr[i + 1];
MASK_FILL(res0, pathA0, dstA0, vis_read_hi(dstARGB), srcA0, srcARGB0);
MASK_FILL(res1, pathA1, dstA1, vis_read_lo(dstARGB), srcA1, srcARGB1);
res0 = vis_fpack16_pair(res0, res1);
msk = (((-pathA0) & (1 << 11)) | ((-pathA1) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
*(mlib_u8*)(dst_ptr + i ) = dstA0;
*(mlib_u8*)(dst_ptr + i + 1) = dstA1;
}
if (i < width) {
pathA0 = pMask[i];
if (pathA0) {
dstA0 = *(mlib_u8*)(dst_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
dst_ptr[i] = vis_fpack16(res0);
*(mlib_u8*)(dst_ptr + i) = dstA0;
}
}
}
/***************************************************************/
#undef MASK_FILL
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcA, srcARGB) \
{ \
srcF = ((dstA & SrcOpAnd) ^ SrcOpXor) + SrcOpAdd; \
\
srcA = mul8_tbl[srcF + srcAx256]; \
dstA = mul8_tbl[dstF + (dstA << 8)]; \
\
BLEND_VIS(rr, dstARGB, srcARGB, dstA, srcA); \
}
/***************************************************************/
static void IntRgbToIntArgbAlphaMaskBlit_A1_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_tbl)
{
mlib_s32 i;
mlib_s32 dstA0, srcA, srcA0;
mlib_d64 res0;
mlib_f32 dstARGB0, srcARGB0;
mlib_s32 SrcOpAnd = log_val[0];
mlib_s32 SrcOpXor = log_val[1];
mlib_s32 SrcOpAdd = log_val[2];
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF, dstF, srcAx256;
srcA = 0xFF;
srcA = mul8_extra[srcA];
srcAx256 = srcA << 8;
dstF = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd;
#pragma pipeloop(0)
for (i = 0; i < width; i++) {
dstA0 = *(mlib_u8*)(dst_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
dst_ptr[i] = vis_fpack16(res0);
*(mlib_u8*)(dst_ptr + i) = dstA0;
}
}
/***************************************************************/
void ADD_SUFF(IntRgbToIntArgbAlphaMaskBlit)(MASKBLIT_PARAMS)
{
mlib_s32 extraA;
mlib_s32 dstScan = pDstInfo->scanStride;
mlib_s32 srcScan = pSrcInfo->scanStride;
mlib_s32 log_val[6];
mlib_s32 j;
mlib_s32 SrcOpAnd;
mlib_s32 SrcOpXor;
mlib_s32 SrcOpAdd;
mlib_s32 DstOpAnd;
mlib_s32 DstOpXor;
mlib_s32 DstOpAdd;
mlib_u8 *mul8_extra;
extraA = (mlib_s32)(pCompInfo->details.extraAlpha * 255.0 + 0.5);
mul8_extra = mul8table[extraA];
SrcOpAnd = (AlphaRules[pCompInfo->rule].srcOps).andval;
SrcOpXor = (AlphaRules[pCompInfo->rule].srcOps).xorval;
SrcOpAdd = (AlphaRules[pCompInfo->rule].srcOps).addval;
SrcOpAdd -= SrcOpXor;
DstOpAnd = (AlphaRules[pCompInfo->rule].dstOps).andval;
DstOpXor = (AlphaRules[pCompInfo->rule].dstOps).xorval;
DstOpAdd = (AlphaRules[pCompInfo->rule].dstOps).addval;
DstOpAdd -= DstOpXor;
log_val[0] = SrcOpAnd;
log_val[1] = SrcOpXor;
log_val[2] = SrcOpAdd;
log_val[3] = DstOpAnd;
log_val[4] = DstOpXor;
log_val[5] = DstOpAdd;
vis_write_gsr(7 << 3);
if (pMask != NULL) {
pMask += maskOff;
if (dstScan == 4*width && srcScan == dstScan && maskScan == width) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntRgbToIntArgbAlphaMaskBlit_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
(void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
PTR_ADD(pMask, maskScan);
}
} else {
if (dstScan == 4*width && srcScan == dstScan) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntRgbToIntArgbAlphaMaskBlit_A1_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
(void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
}
}
}
/***************************************************************/
void ADD_SUFF(IntRgbToFourByteAbgrAlphaMaskBlit)(MASKBLIT_PARAMS)
{
mlib_d64 buff[BUFF_SIZE/2];
void *src_buff = buff, *dst_buff;
mlib_s32 extraA;
mlib_s32 dstScan = pDstInfo->scanStride;
mlib_s32 srcScan = pSrcInfo->scanStride;
mlib_s32 log_val[6];
mlib_s32 j;
mlib_s32 SrcOpAnd;
mlib_s32 SrcOpXor;
mlib_s32 SrcOpAdd;
mlib_s32 DstOpAnd;
mlib_s32 DstOpXor;
mlib_s32 DstOpAdd;
mlib_u8 *mul8_extra;
extraA = (mlib_s32)(pCompInfo->details.extraAlpha * 255.0 + 0.5);
mul8_extra = mul8table[extraA];
SrcOpAnd = (AlphaRules[pCompInfo->rule].srcOps).andval;
SrcOpXor = (AlphaRules[pCompInfo->rule].srcOps).xorval;
SrcOpAdd = (AlphaRules[pCompInfo->rule].srcOps).addval;
SrcOpAdd -= SrcOpXor;
DstOpAnd = (AlphaRules[pCompInfo->rule].dstOps).andval;
DstOpXor = (AlphaRules[pCompInfo->rule].dstOps).xorval;
DstOpAdd = (AlphaRules[pCompInfo->rule].dstOps).addval;
DstOpAdd -= DstOpXor;
log_val[0] = SrcOpAnd;
log_val[1] = SrcOpXor;
log_val[2] = SrcOpAdd;
log_val[3] = DstOpAnd;
log_val[4] = DstOpXor;
log_val[5] = DstOpAdd;
vis_write_gsr(7 << 3);
if (2*width > BUFF_SIZE) src_buff = mlib_malloc(2*width*sizeof(mlib_s32));
dst_buff = (mlib_s32*)src_buff + width;
if (pMask != NULL) {
pMask += maskOff;
for (j = 0; j < height; j++) {
IntArgbToIntAbgrConvert_line(srcBase, src_buff, width);
if (!((mlib_s32)dstBase & 3)) {
IntRgbToIntArgbAlphaMaskBlit_line(dstBase, src_buff, pMask,
width, log_val, mul8_extra,
(void*)mul8table);
} else {
mlib_ImageCopy_na(dstBase, dst_buff, width*sizeof(mlib_s32));
IntRgbToIntArgbAlphaMaskBlit_line(dst_buff, src_buff, pMask,
width, log_val, mul8_extra,
(void*)mul8table);
mlib_ImageCopy_na(dst_buff, dstBase, width*sizeof(mlib_s32));
}
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
PTR_ADD(pMask, maskScan);
}
} else {
for (j = 0; j < height; j++) {
IntArgbToIntAbgrConvert_line(srcBase, src_buff, width);
if (!((mlib_s32)dstBase & 3)) {
IntRgbToIntArgbAlphaMaskBlit_A1_line(dstBase, src_buff, pMask,
width, log_val,
mul8_extra,
(void*)mul8table);
} else {
mlib_ImageCopy_na(dstBase, dst_buff, width*sizeof(mlib_s32));
IntRgbToIntArgbAlphaMaskBlit_A1_line(dst_buff, src_buff, pMask,
width, log_val,
mul8_extra,
(void*)mul8table);
mlib_ImageCopy_na(dst_buff, dstBase, width*sizeof(mlib_s32));
}
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
}
}
if (src_buff != buff) {
mlib_free(src_buff);
}
}
/***************************************************************/
/* ##############################################################
* IntArgbToIntBgrAlphaMaskBlit()
*/
#undef MASK_FILL
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcA, srcARGB) \
srcA = mul8_extra[srcA]; \
dstF = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd; \
\
srcF = mul8_srcF[pathA]; \
dstA = mul8_tbl[(pathA << 8) + dstF] + (0xff - pathA); \
\
pathA = dstA - 0xff - srcF; \
/* (pathA == 0) if (dstA == 0xFF && srcF == 0) */ \
\
srcA = MUL8_INT(srcA, srcF); \
\
BLEND_VIS_RGB(rr, dstARGB, srcARGB, dstA, srcA)
/***************************************************************/
static void IntArgbToIntBgrAlphaMaskBlit_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_srcF,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA0, pathA1, dstA0, dstA1, srcA0, srcA1, msk;
mlib_d64 res0, res1, dstARGB, srcARGB;
mlib_f32 dstARGB0, srcARGB0;
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF, dstF;
#if VIS >= 0x200
vis_write_bmask(0x03214765, 0);
#endif
i = i0 = 0;
if ((mlib_s32)dst_ptr & 7) {
pathA0 = pMask[i];
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
ARGB2ABGR_FL(srcARGB0)
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
pathA0 = pMask[i];
pathA1 = pMask[i + 1];
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcA0 = *(mlib_u8*)(src_ptr + i);
srcA1 = *(mlib_u8*)(src_ptr + i + 1);
srcARGB = vis_freg_pair(src_ptr[i], src_ptr[i + 1]);
ARGB2ABGR_DB(srcARGB)
MASK_FILL(res0, pathA0, dstA0, vis_read_hi(dstARGB),
srcA0, vis_read_hi(srcARGB));
MASK_FILL(res1, pathA1, dstA1, vis_read_lo(dstARGB),
srcA1, vis_read_lo(srcARGB));
res0 = vis_fpack16_pair(res0, res1);
msk = (((pathA0) & (1 << 11)) | ((pathA1) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
}
if (i < width) {
pathA0 = pMask[i];
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
ARGB2ABGR_FL(srcARGB0)
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
}
}
/***************************************************************/
#undef MASK_FILL
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcA, srcARGB) \
srcA = mul8_extra[srcA]; \
dstA = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd; \
\
srcA = mul8_srcF[srcA]; \
\
pathA = dstA - srcF_255; \
/* (pathA == 0) if (dstA == 0xFF && srcF == 0) */ \
\
BLEND_VIS(rr, dstARGB, srcARGB, dstA, srcA)
/***************************************************************/
static void IntArgbToIntBgrAlphaMaskBlit_A1_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_srcF,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA0, pathA1, dstA0, dstA1, srcA0, srcA1, msk;
mlib_d64 res0, res1, dstARGB, srcARGB;
mlib_f32 dstARGB0, srcARGB0;
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF_255 = mul8_srcF[0xff] + 0xff;
#if VIS >= 0x200
vis_write_bmask(0x03214765, 0);
#endif
i = i0 = 0;
if ((mlib_s32)dst_ptr & 7) {
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
ARGB2ABGR_FL(srcARGB0)
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcA0 = *(mlib_u8*)(src_ptr + i);
srcA1 = *(mlib_u8*)(src_ptr + i + 1);
srcARGB = vis_freg_pair(src_ptr[i], src_ptr[i + 1]);
ARGB2ABGR_DB(srcARGB)
MASK_FILL(res0, pathA0, dstA0, vis_read_hi(dstARGB),
srcA0, vis_read_hi(srcARGB));
MASK_FILL(res1, pathA1, dstA1, vis_read_lo(dstARGB),
srcA1, vis_read_lo(srcARGB));
res0 = vis_fpack16_pair(res0, res1);
msk = (((pathA0) & (1 << 11)) | ((pathA1) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
}
if (i < width) {
srcA0 = *(mlib_u8*)(src_ptr + i);
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
ARGB2ABGR_FL(srcARGB0)
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
}
}
/***************************************************************/
void ADD_SUFF(IntArgbToIntBgrAlphaMaskBlit)(MASKBLIT_PARAMS)
{
mlib_s32 extraA, srcF;
mlib_s32 dstScan = pDstInfo->scanStride;
mlib_s32 srcScan = pSrcInfo->scanStride;
mlib_s32 log_val[6];
mlib_s32 j;
mlib_s32 SrcOpAnd;
mlib_s32 SrcOpXor;
mlib_s32 SrcOpAdd;
mlib_s32 DstOpAnd;
mlib_s32 DstOpXor;
mlib_s32 DstOpAdd;
mlib_u8 *mul8_extra, *mul8_srcF;
extraA = (mlib_s32)(pCompInfo->details.extraAlpha * 255.0 + 0.5);
mul8_extra = mul8table[extraA];
SrcOpAnd = (AlphaRules[pCompInfo->rule].srcOps).andval;
SrcOpXor = (AlphaRules[pCompInfo->rule].srcOps).xorval;
SrcOpAdd = (AlphaRules[pCompInfo->rule].srcOps).addval;
SrcOpAdd -= SrcOpXor;
DstOpAnd = (AlphaRules[pCompInfo->rule].dstOps).andval;
DstOpXor = (AlphaRules[pCompInfo->rule].dstOps).xorval;
DstOpAdd = (AlphaRules[pCompInfo->rule].dstOps).addval;
DstOpAdd -= DstOpXor;
log_val[3] = DstOpAnd;
log_val[4] = DstOpXor;
log_val[5] = DstOpAdd;
srcF = ((0xff & SrcOpAnd) ^ SrcOpXor) + SrcOpAdd;
mul8_srcF = mul8table[srcF];
vis_write_gsr(7 << 3);
if (pMask != NULL) {
if (dstScan == 4*width && srcScan == dstScan && maskScan == width) {
width *= height;
height = 1;
}
pMask += maskOff;
for (j = 0; j < height; j++) {
IntArgbToIntBgrAlphaMaskBlit_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
mul8_srcF, (void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
PTR_ADD(pMask, maskScan);
}
} else {
if (dstScan == 4*width && srcScan == dstScan) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntArgbToIntBgrAlphaMaskBlit_A1_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
mul8_srcF, (void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
}
}
}
/***************************************************************/
/* ##############################################################
* IntRgbToIntRgbAlphaMaskBlit()
* IntRgbToIntBgrAlphaMaskBlit()
* IntBgrToIntBgrAlphaMaskBlit()
*/
#undef MASK_FILL
#define MASK_FILL(rr, pathA, dstA, dstARGB, srcAX, srcARGB) \
srcF = mul8_srcF[pathA]; \
dstA = mul8_tbl[(pathA << 8) + dstF] + (0xff - pathA); \
pathA = dstA - 0xff - srcF; \
srcAX = mul8_tbl[srcA + (srcF << 8)]; \
\
BLEND_VIS_RGB(rr, dstARGB, srcARGB, dstA, srcAX)
/***************************************************************/
static void IntRgbToIntRgbAlphaMaskBlit_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_srcF,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA0, pathA1, dstA0, dstA1, srcA, srcA0, srcA1, msk;
mlib_d64 res0, res1, dstARGB;
mlib_f32 dstARGB0, srcARGB0, srcARGB1;
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF, dstF;
i = i0 = 0;
srcA = 0xFF;
srcA = mul8_extra[srcA];
dstF = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd;
if ((mlib_s32)dst_ptr & 7) {
pathA0 = pMask[i];
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
pathA0 = pMask[i];
pathA1 = pMask[i + 1];
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcARGB0 = src_ptr[i];
srcARGB1 = src_ptr[i + 1];
MASK_FILL(res0, pathA0, dstA0, vis_read_hi(dstARGB), srcA0, srcARGB0);
MASK_FILL(res1, pathA1, dstA1, vis_read_lo(dstARGB), srcA1, srcARGB1);
res0 = vis_fpack16_pair(res0, res1);
msk = (((pathA0) & (1 << 11)) | ((pathA1) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
}
if (i < width) {
pathA0 = pMask[i];
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
}
}
/***************************************************************/
static void IntRgbToIntBgrAlphaMaskBlit_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_srcF,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA0, pathA1, dstA0, dstA1, srcA, srcA0, srcA1, msk;
mlib_d64 res0, res1, dstARGB, srcARGB;
mlib_f32 dstARGB0, srcARGB0;
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF, dstF;
#if VIS >= 0x200
vis_write_bmask(0x03214765, 0);
#endif
i = i0 = 0;
srcA = 0xFF;
srcA = mul8_extra[srcA];
dstF = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd;
if ((mlib_s32)dst_ptr & 7) {
pathA0 = pMask[i];
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
ARGB2ABGR_FL(srcARGB0)
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
pathA0 = pMask[i];
pathA1 = pMask[i + 1];
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcARGB = vis_freg_pair(src_ptr[i], src_ptr[i + 1]);
ARGB2ABGR_DB(srcARGB)
MASK_FILL(res0, pathA0, dstA0, vis_read_hi(dstARGB),
srcA0, vis_read_hi(srcARGB));
MASK_FILL(res1, pathA1, dstA1, vis_read_lo(dstARGB),
srcA1, vis_read_lo(srcARGB));
res0 = vis_fpack16_pair(res0, res1);
msk = (((pathA0) & (1 << 11)) | ((pathA1) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
}
if (i < width) {
pathA0 = pMask[i];
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
ARGB2ABGR_FL(srcARGB0)
MASK_FILL(res0, pathA0, dstA0, dstARGB0, srcA0, srcARGB0);
if (pathA0) {
dst_ptr[i] = vis_fpack16(res0);
}
}
}
/***************************************************************/
#undef MASK_FILL
#define MASK_FILL(rr, dstARGB, srcARGB) \
t0 = vis_fmul8x16al(srcARGB, srcA_mul); \
t1 = vis_fmul8x16al(dstARGB, dstA_mul); \
rr = vis_fpadd16(t0, t1); \
rr = vis_fpadd16(vis_fmul8sux16(rr, dstA_div), \
vis_fmul8ulx16(rr, dstA_div))
/***************************************************************/
static void IntRgbToIntRgbAlphaMaskBlit_A1_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_srcF,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA, dstA, srcA, msk;
mlib_d64 res0, res1, dstARGB;
mlib_f32 dstARGB0, srcARGB0, srcARGB1, srcA_mul, dstA_mul;
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF_255 = mul8_srcF[0xff] + 0xff;
mlib_d64 t0, t1, dstA_div;
i = i0 = 0;
srcA = 0xFF;
srcA = mul8_extra[srcA];
dstA = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd;
srcA = mul8_srcF[srcA];
pathA = dstA - srcF_255;
srcA_mul = ((mlib_f32*)vis_mul8s_tbl)[srcA];
dstA_mul = ((mlib_f32*)vis_mul8s_tbl)[dstA];
dstA += srcA;
dstA_div = ((mlib_d64*)vis_div8_tbl)[dstA];
if ((mlib_s32)dst_ptr & 7) {
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, dstARGB0, srcARGB0);
if (pathA) {
dst_ptr[i] = vis_fpack16(res0);
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcARGB0 = src_ptr[i];
srcARGB1 = src_ptr[i + 1];
MASK_FILL(res0, vis_read_hi(dstARGB), srcARGB0);
MASK_FILL(res1, vis_read_lo(dstARGB), srcARGB1);
res0 = vis_fpack16_pair(res0, res1);
msk = (((pathA) & (1 << 11)) | ((pathA) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
}
if (i < width) {
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
MASK_FILL(res0, dstARGB0, srcARGB0);
if (pathA) {
dst_ptr[i] = vis_fpack16(res0);
}
}
}
/***************************************************************/
static void IntRgbToIntBgrAlphaMaskBlit_A1_line(mlib_f32 *dst_ptr,
mlib_f32 *src_ptr,
mlib_u8 *pMask,
mlib_s32 width,
mlib_s32 *log_val,
mlib_u8 *mul8_extra,
mlib_u8 *mul8_srcF,
mlib_u8 *mul8_tbl)
{
mlib_s32 i, i0;
mlib_s32 pathA, dstA, srcA, msk;
mlib_d64 res0, res1, dstARGB, srcARGB;
mlib_f32 dstARGB0, srcARGB0, srcA_mul, dstA_mul;
mlib_s32 DstOpAnd = log_val[3];
mlib_s32 DstOpXor = log_val[4];
mlib_s32 DstOpAdd = log_val[5];
mlib_s32 srcF_255 = mul8_srcF[0xff] + 0xff;
mlib_d64 t0, t1, dstA_div;
#if VIS >= 0x200
vis_write_bmask(0x03214765, 0);
#endif
i = i0 = 0;
srcA = 0xFF;
srcA = mul8_extra[srcA];
dstA = ((srcA & DstOpAnd) ^ DstOpXor) + DstOpAdd;
srcA = mul8_srcF[srcA];
pathA = dstA - srcF_255;
srcA_mul = ((mlib_f32*)vis_mul8s_tbl)[srcA];
dstA_mul = ((mlib_f32*)vis_mul8s_tbl)[dstA];
dstA += srcA;
dstA_div = ((mlib_d64*)vis_div8_tbl)[dstA];
if ((mlib_s32)dst_ptr & 7) {
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
ARGB2ABGR_FL(srcARGB0)
MASK_FILL(res0, dstARGB0, srcARGB0);
if (pathA) {
dst_ptr[i] = vis_fpack16(res0);
}
i0 = 1;
}
#pragma pipeloop(0)
for (i = i0; i <= width - 2; i += 2) {
dstARGB = *(mlib_d64*)(dst_ptr + i);
srcARGB = vis_freg_pair(src_ptr[i], src_ptr[i + 1]);
ARGB2ABGR_DB(srcARGB)
MASK_FILL(res0, vis_read_hi(dstARGB), vis_read_hi(srcARGB));
MASK_FILL(res1, vis_read_lo(dstARGB), vis_read_lo(srcARGB));
res0 = vis_fpack16_pair(res0, res1);
msk = (((pathA) & (1 << 11)) | ((pathA) & (1 << 10))) >> 10;
vis_pst_32(res0, dst_ptr + i, msk);
}
if (i < width) {
dstARGB0 = dst_ptr[i];
srcARGB0 = src_ptr[i];
ARGB2ABGR_FL(srcARGB0)
MASK_FILL(res0, dstARGB0, srcARGB0);
if (pathA) {
dst_ptr[i] = vis_fpack16(res0);
}
}
}
/***************************************************************/
void ADD_SUFF(IntRgbToIntRgbAlphaMaskBlit)(MASKBLIT_PARAMS)
{
mlib_s32 extraA, srcF;
mlib_s32 dstScan = pDstInfo->scanStride;
mlib_s32 srcScan = pSrcInfo->scanStride;
mlib_s32 log_val[6];
mlib_s32 j;
mlib_s32 SrcOpAnd;
mlib_s32 SrcOpXor;
mlib_s32 SrcOpAdd;
mlib_s32 DstOpAnd;
mlib_s32 DstOpXor;
mlib_s32 DstOpAdd;
mlib_u8 *mul8_extra, *mul8_srcF;
extraA = (mlib_s32)(pCompInfo->details.extraAlpha * 255.0 + 0.5);
mul8_extra = mul8table[extraA];
SrcOpAnd = (AlphaRules[pCompInfo->rule].srcOps).andval;
SrcOpXor = (AlphaRules[pCompInfo->rule].srcOps).xorval;
SrcOpAdd = (AlphaRules[pCompInfo->rule].srcOps).addval;
SrcOpAdd -= SrcOpXor;
DstOpAnd = (AlphaRules[pCompInfo->rule].dstOps).andval;
DstOpXor = (AlphaRules[pCompInfo->rule].dstOps).xorval;
DstOpAdd = (AlphaRules[pCompInfo->rule].dstOps).addval;
DstOpAdd -= DstOpXor;
log_val[3] = DstOpAnd;
log_val[4] = DstOpXor;
log_val[5] = DstOpAdd;
srcF = ((0xff & SrcOpAnd) ^ SrcOpXor) + SrcOpAdd;
mul8_srcF = mul8table[srcF];
vis_write_gsr(7 << 3);
if (pMask != NULL) {
pMask += maskOff;
if (dstScan == 4*width && srcScan == dstScan && maskScan == width) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntRgbToIntRgbAlphaMaskBlit_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
mul8_srcF, (void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
PTR_ADD(pMask, maskScan);
}
} else {
if (dstScan == 4*width && srcScan == dstScan) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntRgbToIntRgbAlphaMaskBlit_A1_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
mul8_srcF, (void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
}
}
}
/***************************************************************/
void ADD_SUFF(IntRgbToIntBgrAlphaMaskBlit)(MASKBLIT_PARAMS)
{
mlib_s32 extraA, srcF;
mlib_s32 dstScan = pDstInfo->scanStride;
mlib_s32 srcScan = pSrcInfo->scanStride;
mlib_s32 log_val[6];
mlib_s32 j;
mlib_s32 SrcOpAnd;
mlib_s32 SrcOpXor;
mlib_s32 SrcOpAdd;
mlib_s32 DstOpAnd;
mlib_s32 DstOpXor;
mlib_s32 DstOpAdd;
mlib_u8 *mul8_extra, *mul8_srcF;
extraA = (mlib_s32)(pCompInfo->details.extraAlpha * 255.0 + 0.5);
mul8_extra = mul8table[extraA];
SrcOpAnd = (AlphaRules[pCompInfo->rule].srcOps).andval;
SrcOpXor = (AlphaRules[pCompInfo->rule].srcOps).xorval;
SrcOpAdd = (AlphaRules[pCompInfo->rule].srcOps).addval;
SrcOpAdd -= SrcOpXor;
DstOpAnd = (AlphaRules[pCompInfo->rule].dstOps).andval;
DstOpXor = (AlphaRules[pCompInfo->rule].dstOps).xorval;
DstOpAdd = (AlphaRules[pCompInfo->rule].dstOps).addval;
DstOpAdd -= DstOpXor;
log_val[3] = DstOpAnd;
log_val[4] = DstOpXor;
log_val[5] = DstOpAdd;
srcF = ((0xff & SrcOpAnd) ^ SrcOpXor) + SrcOpAdd;
mul8_srcF = mul8table[srcF];
vis_write_gsr(7 << 3);
if (pMask != NULL) {
pMask += maskOff;
if (dstScan == 4*width && srcScan == dstScan && maskScan == width) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntRgbToIntBgrAlphaMaskBlit_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
mul8_srcF, (void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
PTR_ADD(pMask, maskScan);
}
} else {
if (dstScan == 4*width && srcScan == dstScan) {
width *= height;
height = 1;
}
for (j = 0; j < height; j++) {
IntRgbToIntBgrAlphaMaskBlit_A1_line(dstBase, srcBase, pMask,
width, log_val, mul8_extra,
mul8_srcF, (void*)mul8table);
PTR_ADD(dstBase, dstScan);
PTR_ADD(srcBase, srcScan);
}
}
}
/***************************************************************/
#ifdef MLIB_ADD_SUFF
#pragma weak IntBgrToIntBgrAlphaMaskBlit_F = IntRgbToIntRgbAlphaMaskBlit_F
#else
#pragma weak IntBgrToIntBgrAlphaMaskBlit = IntRgbToIntRgbAlphaMaskBlit
#endif
/***************************************************************/
/*
mlib_d64 buff[BUFF_SIZE/2];
void *pbuff = buff;
if (width > BUFF_SIZE) pbuff = mlib_malloc(width*sizeof(mlib_s32));
ADD_SUFF(ThreeByteBgrToIntArgbConvert)(rasBase, pbuff, width, 1,
pRasInfo, pRasInfo,
pPrim, pCompInfo);
ADD_SUFF(IntArgbToThreeByteBgrConvert)(pbuff, rasBase, width, 1,
pRasInfo, pRasInfo,
pPrim, pCompInfo);
if (pbuff != buff) {
mlib_free(pbuff);
}
*/
#endif