blob: 32e00163575fd565936676423c227a3b1ff68c8d [file] [log] [blame]
/*
* Copyright (c) 2003, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation. Oracle designates this
* particular file as subject to the "Classpath" exception as provided
* by Oracle in the LICENSE file that accompanied this code.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*/
#ifndef __MLIB_V_IMAGECONSTLOGIC_H
#define __MLIB_V_IMAGECONSTLOGIC_H
#if defined ( VIS )
#if VIS >= 0x200
#error This include file can be used with VIS 1.0 only
#endif /* VIS >= 0x200 */
#endif /* defined ( VIS ) */
#include <mlib_image.h>
#include <vis_proto.h>
#include <mlib_ImageCheck.h>
#include <mlib_ImageLogic_proto.h>
#include <mlib_v_ImageLogic_proto.h>
#ifdef __cplusplus
extern "C" {
#endif /* __cplusplus */
/*
* Macro definitions for VIS version image logical functions.
*/
/***************************************************************/
/*
 * VALIDATE() - common prologue of the constant-logic kernel.
 *
 * Expands in place inside a function that has `dst`, `src` (images) and
 * `c` (array of per-channel constants) in scope.  The expansion
 *   - declares the locals sp/sl, dp/dl, width, height, type, nchannels,
 *     stride, strided, c01..c04 and dc01..dc03;
 *   - invokes MLIB_IMAGE_SIZE_EQUAL / TYPE_EQUAL / CHAN_EQUAL on dst, src
 *     (those macros are defined elsewhere);
 *   - converts `width` from pixels to bytes per row;
 *   - packs the channel constants into 8-byte patterns: dc01 alone for
 *     1, 2 and 4 channels (dc01 + dc02 for 4-channel 32-bit data), and
 *     dc01, dc02, dc03 (24 bytes, one full period) for 3 channels;
 *   - returns MLIB_FAILURE from the enclosing function when a row in bytes
 *     is wider than either stride.
 *
 * Any type other than MLIB_SHORT or MLIB_BYTE is handled as 4-byte
 * elements.  Because the expansion starts with declarations, place it
 * directly after the caller's own declarations.
 *
 * Constants are cast to mlib_u32 before being shifted into the top bits:
 * shifting a signed int so that a one reaches the sign bit is undefined.
 */
#define VALIDATE()                                                      \
  mlib_u8 *sp, *sl;     /* pointers for pixel and line of source */     \
  mlib_u8 *dp, *dl;     /* pointers for pixel and line of dst */        \
  mlib_s32 width, height, type, nchannels;                              \
  mlib_s32 stride;      /* for src */                                   \
  mlib_s32 strided;     /* for dst */                                   \
  mlib_u32 c01, c02, c03, c04;                                          \
  mlib_d64 dc01, dc02, dc03;                                            \
                                                                        \
  MLIB_IMAGE_SIZE_EQUAL(dst,src);                                       \
  MLIB_IMAGE_TYPE_EQUAL(dst,src);                                       \
  MLIB_IMAGE_CHAN_EQUAL(dst,src);                                       \
                                                                        \
  dp        = (mlib_u8 *) mlib_ImageGetData(dst);                       \
  sp        = (mlib_u8 *) mlib_ImageGetData(src);                       \
  height    = mlib_ImageGetHeight(dst);                                 \
  width     = mlib_ImageGetWidth(dst);                                  \
  stride    = mlib_ImageGetStride(src);                                 \
  strided   = mlib_ImageGetStride(dst);                                 \
  nchannels = mlib_ImageGetChannels(dst);                               \
  type      = mlib_ImageGetType(dst);                                   \
                                                                        \
  if (type == MLIB_SHORT) {                                             \
    width *= (2 * nchannels);                                           \
    if (nchannels == 1) {                                               \
      c01 = c[0] & 0xFFFF; c01 |= (c01 << 16);                          \
      dc01 = vis_to_double_dup(c01);                                    \
    } else if (nchannels == 2) {                                        \
      c01 = ((mlib_u32) (c[0] & 0xFFFF) << 16) | (c[1] & 0xFFFF);       \
      dc01 = vis_to_double_dup(c01);                                    \
    } else if (nchannels == 3) {                                        \
      c01 = ((mlib_u32) (c[0] & 0xFFFF) << 16) | (c[1] & 0xFFFF);       \
      c02 = ((mlib_u32) (c[2] & 0xFFFF) << 16) | (c01 >> 16);           \
      c03 = (c01 << 16) | (c02 >> 16);                                  \
      dc01= vis_to_double(c01, c02);                                    \
      dc02= vis_to_double(c03, c01);                                    \
      dc03= vis_to_double(c02, c03);                                    \
    } else {                                                            \
      c01 = ((mlib_u32) (c[0] & 0xFFFF) << 16) | (c[1] & 0xFFFF);       \
      c02 = ((mlib_u32) (c[2] & 0xFFFF) << 16) | (c[3] & 0xFFFF);       \
      dc01= vis_to_double(c01, c02);                                    \
    }                                                                   \
                                                                        \
  } else if (type == MLIB_BYTE) {                                       \
    width *= nchannels;                                                 \
    if (nchannels == 1) {                                               \
      c01 = c[0] & 0xFF; c01 |= (c01 << 8);                             \
      c01 |= (c01 << 16);                                               \
      dc01 = vis_to_double_dup(c01);                                    \
    } else if (nchannels == 2) {                                        \
      c01 = ((c[0] & 0xFF) << 8) | (c[1] & 0xFF);                       \
      c01 |= (c01 << 16);                                               \
      dc01 = vis_to_double_dup(c01);                                    \
    } else if (nchannels == 3) {                                        \
      c01 = ((c[0] & 0xFF) << 16) | ((c[1] & 0xFF) << 8) |              \
             (c[2] & 0xFF);                                             \
      c02 = (c01 << 16) | (c01 >> 8);                                   \
      c03 = (c01 << 24) | c01;                                          \
      c01 = (c01 << 8) | (c01 >> 16);                                   \
      dc01= vis_to_double(c01, c02);                                    \
      dc02= vis_to_double(c03, c01);                                    \
      dc03= vis_to_double(c02, c03);                                    \
    } else {                                                            \
      c01 = ((mlib_u32) (c[0] & 0xFF) << 24) | ((c[1] & 0xFF) << 16) |  \
            ((c[2] & 0xFF) << 8) | (c[3] & 0xFF);                       \
      dc01 = vis_to_double_dup(c01);                                    \
    }                                                                   \
  } else {                                                              \
    width *= (4 * nchannels);                                           \
    if (nchannels == 1) {                                               \
      c01 = c[0] & 0xFFFFFFFF;                                          \
      dc01 = vis_to_double_dup(c01);                                    \
    } else if (nchannels == 2) {                                        \
      c01 = c[0] & 0xFFFFFFFF; c02 = c[1] & 0xFFFFFFFF;                 \
      dc01 = vis_to_double(c01, c02);                                   \
    } else if (nchannels == 3) {                                        \
      c01 = c[0] & 0xFFFFFFFF; c02 = c[1] & 0xFFFFFFFF;                 \
      c03 = c[2] & 0xFFFFFFFF;                                          \
      dc01= vis_to_double(c01, c02);                                    \
      dc02= vis_to_double(c03, c01);                                    \
      dc03= vis_to_double(c02, c03);                                    \
    } else {                                                            \
      c01 = c[0] & 0xFFFFFFFF; c02 = c[1] & 0xFFFFFFFF;                 \
      c03 = c[2] & 0xFFFFFFFF; c04 = c[3] & 0xFFFFFFFF;                 \
      dc01= vis_to_double(c01, c02);                                    \
      dc02= vis_to_double(c03, c04);                                    \
    }                                                                   \
  }                                                                     \
                                                                        \
  if ((width > stride) || (width > strided))                            \
    return MLIB_FAILURE
/***************************************************************/
static mlib_status mlib_v_ImageConstLogic(mlib_image *dst,
mlib_image *src,
mlib_s32 *c)
{
mlib_s32 i, j;
mlib_s32 offdst, offsrc, emask;
mlib_d64 *dpp, *spp;
mlib_d64 sa1, sa2, da, sa;
mlib_d64 ssa, ssa1, ssa2, sa3, sa4;
mlib_s32 amount;
mlib_u8 *dend;
mlib_d64 c1, c2, c3;
VALIDATE();
if (nchannels == 3) {
if ((width == stride) && (width == strided) && ((width - (width / 3) * 3) == 0)) {
amount = height * width;
dend = dp + amount - 1;
offdst = ((mlib_addr) dp) & 7;
offsrc = ((mlib_addr) sp) & 7;
if (offsrc == offdst) {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c3 = vis_faligndata(dc03, dc01);
c1 = vis_faligndata(dc01, dc02);
c2 = vis_faligndata(dc02, dc03);
}
else {
c1 = dc01;
c2 = dc02;
c3 = dc03;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, 0);
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c3, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
#pragma pipeloop(0)
for (; i < amount - 24; i += 24) {
dpp[0] = VIS_CONSTLOGIC(c1, spp[0]);
dpp[1] = VIS_CONSTLOGIC(c2, spp[1]);
dpp[2] = VIS_CONSTLOGIC(c3, spp[2]);
dpp += 3;
spp += 3;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c1, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c2, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c3, sa1);
vis_pst_8(da, dpp, emask);
}
}
else {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c3 = vis_faligndata(dc03, dc01);
c1 = vis_faligndata(dc01, dc02);
c2 = vis_faligndata(dc02, dc03);
}
else {
c1 = dc01;
c2 = dc02;
c3 = dc03;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, i);
sa1 = spp[0];
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c3, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
#pragma pipeloop(0)
for (; i < amount - 24; i += 24) {
sa2 = spp[1];
ssa = vis_faligndata(sa1, sa2);
dpp[0] = VIS_CONSTLOGIC(c1, ssa);
sa3 = spp[2];
ssa1 = vis_faligndata(sa2, sa3);
dpp[1] = VIS_CONSTLOGIC(c2, ssa1);
sa4 = spp[3];
ssa2 = vis_faligndata(sa3, sa4);
dpp[2] = VIS_CONSTLOGIC(c3, ssa2);
sa1 = sa4;
dpp += 3;
spp += 3;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c1, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c2, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c3, sa);
vis_pst_8(da, dpp++, emask);
}
}
}
else {
sl = sp;
dl = dp;
amount = width;
for (j = 0; j < height; j++) {
dend = dp + amount - 1;
offdst = ((mlib_addr) dp) & 7;
offsrc = ((mlib_addr) sp) & 7;
if (offsrc == offdst) {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c3 = vis_faligndata(dc03, dc01);
c1 = vis_faligndata(dc01, dc02);
c2 = vis_faligndata(dc02, dc03);
}
else {
c1 = dc01;
c2 = dc02;
c3 = dc03;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, 0);
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c3, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
#pragma pipeloop(0)
for (; i < amount - 24; i += 24) {
dpp[0] = VIS_CONSTLOGIC(c1, spp[0]);
dpp[1] = VIS_CONSTLOGIC(c2, spp[1]);
dpp[2] = VIS_CONSTLOGIC(c3, spp[2]);
dpp += 3;
spp += 3;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c1, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c2, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c3, sa1);
vis_pst_8(da, dpp, emask);
}
}
else {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c3 = vis_faligndata(dc03, dc01);
c1 = vis_faligndata(dc01, dc02);
c2 = vis_faligndata(dc02, dc03);
}
else {
c1 = dc01;
c2 = dc02;
c3 = dc03;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, i);
sa1 = spp[0];
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c3, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
#pragma pipeloop(0)
for (; i < amount - 24; i += 24) {
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
dpp[0] = VIS_CONSTLOGIC(c1, sa);
sa1 = spp[2];
sa = vis_faligndata(sa2, sa1);
dpp[1] = VIS_CONSTLOGIC(c2, sa);
sa2 = spp[3];
sa = vis_faligndata(sa1, sa2);
dpp[2] = VIS_CONSTLOGIC(c3, sa);
sa1 = sa2;
dpp += 3;
spp += 3;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c1, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c2, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c3, sa);
vis_pst_8(da, dpp++, emask);
}
}
sp = sl += stride;
dp = dl += strided;
}
}
}
else if ((type != MLIB_INT) || (nchannels != 4)) {
if ((width == stride) && (width == strided)) {
amount = height * width;
dend = dp + amount - 1;
offdst = ((mlib_addr) dp) & 7;
offsrc = ((mlib_addr) sp) & 7;
if (offsrc == offdst) {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c1 = vis_faligndata(dc01, dc01);
}
else {
c1 = dc01;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, 0);
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c1, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
#pragma pipeloop(0)
for (; i < amount - 8; i += 8) {
*dpp++ = VIS_CONSTLOGIC(c1, *spp);
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp;
da = VIS_CONSTLOGIC(c1, sa1);
vis_pst_8(da, dpp, emask);
}
}
else {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c1 = vis_faligndata(dc01, dc01);
}
else {
c1 = dc01;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, i);
sa1 = spp[0];
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c1, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
#pragma pipeloop(0)
for (; i < amount - 8; i += 8) {
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
*dpp++ = VIS_CONSTLOGIC(c1, sa);
sa1 = sa2;
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c1, sa);
vis_pst_8(da, dpp, emask);
}
}
}
else {
sl = sp;
dl = dp;
amount = width;
for (j = 0; j < height; j++) {
dend = dp + amount - 1;
offdst = ((mlib_addr) dp) & 7;
offsrc = ((mlib_addr) sp) & 7;
if (offsrc == offdst) {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c1 = vis_faligndata(dc01, dc01);
}
else {
c1 = dc01;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, 0);
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c1, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
#pragma pipeloop(0)
for (; i < amount - 8; i += 8) {
*dpp++ = VIS_CONSTLOGIC(c1, *spp);
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp;
da = VIS_CONSTLOGIC(c1, sa1);
vis_pst_8(da, dpp, emask);
}
}
else {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c1 = vis_faligndata(dc01, dc01);
}
else {
c1 = dc01;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, i);
sa1 = spp[0];
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c1, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
#pragma pipeloop(0)
for (; i < amount - 8; i += 8) {
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
*dpp++ = VIS_CONSTLOGIC(c1, sa);
sa1 = sa2;
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c1, sa);
vis_pst_8(da, dpp, emask);
}
}
sp = sl += stride;
dp = dl += strided;
}
}
}
else {
if ((width == stride) && (width == strided)) {
amount = height * width;
dend = dp + amount - 1;
offdst = ((mlib_addr) dp) & 7;
offsrc = ((mlib_addr) sp) & 7;
if (offsrc == offdst) {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c2 = vis_faligndata(dc02, dc01);
c1 = vis_faligndata(dc01, dc02);
}
else {
c1 = dc01;
c2 = dc02;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, 0);
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c2, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
#pragma pipeloop(0)
for (; i < amount - 16; i += 16) {
dpp[0] = VIS_CONSTLOGIC(c1, spp[0]);
dpp[1] = VIS_CONSTLOGIC(c2, spp[1]);
dpp += 2;
spp += 2;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c1, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp;
da = VIS_CONSTLOGIC(c2, sa1);
vis_pst_8(da, dpp++, emask);
}
}
else {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c2 = vis_faligndata(dc02, dc01);
c1 = vis_faligndata(dc01, dc02);
}
else {
c1 = dc01;
c2 = dc02;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, i);
sa1 = spp[0];
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c2, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
#pragma pipeloop(0)
for (; i < amount - 16; i += 16) {
sa2 = spp[1];
ssa = vis_faligndata(sa1, sa2);
dpp[0] = VIS_CONSTLOGIC(c1, ssa);
sa3 = spp[2];
ssa1 = vis_faligndata(sa2, sa3);
dpp[1] = VIS_CONSTLOGIC(c2, ssa1);
sa1 = sa3;
dpp += 2;
spp += 2;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c1, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c2, sa);
vis_pst_8(da, dpp++, emask);
}
}
}
else {
sl = sp;
dl = dp;
amount = width;
for (j = 0; j < height; j++) {
dend = dp + amount - 1;
offdst = ((mlib_addr) dp) & 7;
offsrc = ((mlib_addr) sp) & 7;
if (offsrc == offdst) {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c2 = vis_faligndata(dc02, dc01);
c1 = vis_faligndata(dc01, dc02);
}
else {
c1 = dc01;
c2 = dc02;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, 0);
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c2, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
#pragma pipeloop(0)
for (; i < amount - 16; i += 16) {
dpp[0] = VIS_CONSTLOGIC(c1, spp[0]);
dpp[1] = VIS_CONSTLOGIC(c2, spp[1]);
dpp += 2;
spp += 2;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp++;
da = VIS_CONSTLOGIC(c1, sa1);
vis_pst_8(da, dpp++, emask);
i += 8;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa1 = *spp;
da = VIS_CONSTLOGIC(c2, sa1);
vis_pst_8(da, dpp++, emask);
}
}
else {
/* prepare the destination addresses */
dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
i = (mlib_u8 *) dpp - dp;
if (i != 0) {
vis_alignaddr((void *)(8 - offdst), 0);
c2 = vis_faligndata(dc02, dc01);
c1 = vis_faligndata(dc01, dc02);
}
else {
c1 = dc01;
c2 = dc02;
}
/* prepare the destination addresses */
spp = (mlib_d64 *) vis_alignaddr(sp, i);
sa1 = spp[0];
if (i != 0) {
/* generate edge mask for the start point */
emask = vis_edge8(dp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c2, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
#pragma pipeloop(0)
for (; i < amount - 16; i += 16) {
sa2 = spp[1];
ssa = vis_faligndata(sa1, sa2);
dpp[0] = VIS_CONSTLOGIC(c1, ssa);
sa3 = spp[2];
ssa1 = vis_faligndata(sa2, sa3);
dpp[1] = VIS_CONSTLOGIC(c2, ssa1);
sa1 = sa3;
dpp += 2;
spp += 2;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c1, sa);
vis_pst_8(da, dpp++, emask);
sa1 = sa2;
i += 8;
spp++;
}
if (i < amount) {
emask = vis_edge8(dpp, dend);
sa2 = spp[1];
sa = vis_faligndata(sa1, sa2);
da = VIS_CONSTLOGIC(c2, sa);
vis_pst_8(da, dpp++, emask);
}
}
sp = sl += stride;
dp = dl += strided;
}
}
}
return MLIB_SUCCESS;
}
/***************************************************************/
#ifdef __cplusplus
}
#endif /* __cplusplus */
#endif /* __MLIB_V_IMAGECONSTLOGIC_H */