/*
 * Copyright (c) 2003, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation. Oracle designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Oracle in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

0N/A#ifndef __MLIB_V_IMAGECONSTLOGIC_H
0N/A#define __MLIB_V_IMAGECONSTLOGIC_H
0N/A
0N/A
0N/A#if defined ( VIS )
0N/A#if VIS >= 0x200
0N/A#error This include file can be used with VIS 1.0 only
0N/A#endif /* VIS >= 0x200 */
0N/A#endif /* defined ( VIS ) */
0N/A
0N/A#include <mlib_image.h>
0N/A#include <vis_proto.h>
0N/A#include <mlib_ImageCheck.h>
0N/A#include <mlib_ImageLogic_proto.h>
0N/A#include <mlib_v_ImageLogic_proto.h>
0N/A
0N/A#ifdef __cplusplus
0N/Aextern "C" {
0N/A#endif /* __cplusplus */
0N/A
/*
 * Macro definitions for VIS version image logical functions.
 */

/***************************************************************/

/*
 * VALIDATE() -- common prologue of the constant-logic kernels.
 *
 * Must be expanded at the top of a function body that has `dst`, `src`
 * (image pointers) and `c` (array of per-channel mlib_s32 constants) in
 * scope.  It is deliberately not wrapped in do { } while (0) because it
 * DECLARES the locals the rest of the function works with:
 *
 *   sp, sl / dp, dl   source / destination pixel and line pointers
 *                     (sl and dl are only declared here, not assigned)
 *   width             row length, converted here from pixels to BYTES
 *   height, type, nchannels, stride (src), strided (dst)
 *   dc01, dc02, dc03  the constant replicated into 64-bit words
 *
 * Constant layout (most significant element first):
 *   - 1, 2 or 4 channels of BYTE/SHORT and 1 or 2 channels of 4-byte
 *     samples: the channel pattern fits one 8-byte word, only dc01 is set.
 *   - 3 channels: the pattern repeats every 24 bytes; dc01, dc02, dc03
 *     hold three consecutive 8-byte slices of it.
 *   - 4 channels of 4-byte samples: the pattern repeats every 16 bytes;
 *     dc01 and dc02 are set.
 * Any type other than MLIB_SHORT and MLIB_BYTE takes the 4-byte branch.
 *
 * The MLIB_IMAGE_*_EQUAL checks are defined elsewhere; presumably they
 * return from the enclosing function on mismatch -- confirm in
 * mlib_ImageCheck.h.  The macro itself returns MLIB_FAILURE when a row
 * (in bytes) does not fit into either stride.  The expansion ends without
 * a semicolon; the caller writes `VALIDATE();`.
 *
 * The constants are converted to mlib_u32 BEFORE masking and shifting:
 * left-shifting a signed int into or past the sign bit (for example
 * (c[0] & 0xFF) << 24 with c[0] >= 0x80) is undefined behaviour in ISO C.
 */
#define VALIDATE()                                                         \
  mlib_u8  *sp, *sl;  /* pointers for pixel and line of source */          \
  mlib_u8  *dp, *dl;  /* pointers for pixel and line of dst */             \
  mlib_s32 width, height, type, nchannels;                                 \
  mlib_s32 stride;    /* for src */                                        \
  mlib_s32 strided;   /* for dst */                                        \
  mlib_u32 c01, c02, c03, c04;                                             \
  mlib_d64 dc01, dc02, dc03;                                               \
                                                                           \
  MLIB_IMAGE_SIZE_EQUAL(dst,src);                                          \
  MLIB_IMAGE_TYPE_EQUAL(dst,src);                                          \
  MLIB_IMAGE_CHAN_EQUAL(dst,src);                                          \
                                                                           \
  dp        = (mlib_u8 *) mlib_ImageGetData(dst);                          \
  sp        = (mlib_u8 *) mlib_ImageGetData(src);                          \
  height    = mlib_ImageGetHeight(dst);                                    \
  width     = mlib_ImageGetWidth(dst);                                     \
  stride    = mlib_ImageGetStride(src);                                    \
  strided   = mlib_ImageGetStride(dst);                                    \
  nchannels = mlib_ImageGetChannels(dst);                                  \
  type      = mlib_ImageGetType(dst);                                      \
                                                                           \
  if (type == MLIB_SHORT) {                                                \
    width *= (2 * nchannels);                                              \
    if (nchannels == 1) {                                                  \
      c01 = (mlib_u32) c[0] & 0xFFFF;                                      \
      c01 |= (c01 << 16);                                                  \
      dc01 = vis_to_double_dup(c01);                                       \
    } else if (nchannels == 2) {                                           \
      c01 = (((mlib_u32) c[0] & 0xFFFF) << 16) |                           \
            ((mlib_u32) c[1] & 0xFFFF);                                    \
      dc01 = vis_to_double_dup(c01);                                       \
    } else if (nchannels == 3) {                                           \
      c01 = (((mlib_u32) c[0] & 0xFFFF) << 16) |                           \
            ((mlib_u32) c[1] & 0xFFFF);                                    \
      c02 = (((mlib_u32) c[2] & 0xFFFF) << 16) | (c01 >> 16);              \
      c03 = (c01 << 16) | (c02 >> 16);                                     \
      dc01 = vis_to_double(c01, c02);                                      \
      dc02 = vis_to_double(c03, c01);                                      \
      dc03 = vis_to_double(c02, c03);                                      \
    } else {                                                               \
      c01 = (((mlib_u32) c[0] & 0xFFFF) << 16) |                           \
            ((mlib_u32) c[1] & 0xFFFF);                                    \
      c02 = (((mlib_u32) c[2] & 0xFFFF) << 16) |                           \
            ((mlib_u32) c[3] & 0xFFFF);                                    \
      dc01 = vis_to_double(c01, c02);                                      \
    }                                                                      \
  } else if (type == MLIB_BYTE) {                                          \
    width *= nchannels;                                                    \
    if (nchannels == 1) {                                                  \
      c01 = (mlib_u32) c[0] & 0xFF;                                        \
      c01 |= (c01 << 8);                                                   \
      c01 |= (c01 << 16);                                                  \
      dc01 = vis_to_double_dup(c01);                                       \
    } else if (nchannels == 2) {                                           \
      c01 = (((mlib_u32) c[0] & 0xFF) << 8) | ((mlib_u32) c[1] & 0xFF);    \
      c01 |= (c01 << 16);                                                  \
      dc01 = vis_to_double_dup(c01);                                       \
    } else if (nchannels == 3) {                                           \
      /* c01 starts as 00 c0 c1 c2, then the three rotations are built */  \
      c01 = (((mlib_u32) c[0] & 0xFF) << 16) |                             \
            (((mlib_u32) c[1] & 0xFF) << 8) |                              \
            ((mlib_u32) c[2] & 0xFF);                                      \
      c02 = (c01 << 16) | (c01 >> 8);                                      \
      c03 = (c01 << 24) | c01;                                             \
      c01 = (c01 << 8) | (c01 >> 16);                                      \
      dc01 = vis_to_double(c01, c02);                                      \
      dc02 = vis_to_double(c03, c01);                                      \
      dc03 = vis_to_double(c02, c03);                                      \
    } else {                                                               \
      c01 = (((mlib_u32) c[0] & 0xFF) << 24) |                             \
            (((mlib_u32) c[1] & 0xFF) << 16) |                             \
            (((mlib_u32) c[2] & 0xFF) << 8) |                              \
            ((mlib_u32) c[3] & 0xFF);                                      \
      dc01 = vis_to_double_dup(c01);                                       \
    }                                                                      \
  } else {                                                                 \
    width *= (4 * nchannels);                                              \
    if (nchannels == 1) {                                                  \
      c01 = (mlib_u32) c[0];                                               \
      dc01 = vis_to_double_dup(c01);                                       \
    } else if (nchannels == 2) {                                           \
      c01 = (mlib_u32) c[0];                                               \
      c02 = (mlib_u32) c[1];                                               \
      dc01 = vis_to_double(c01, c02);                                      \
    } else if (nchannels == 3) {                                           \
      c01 = (mlib_u32) c[0];                                               \
      c02 = (mlib_u32) c[1];                                               \
      c03 = (mlib_u32) c[2];                                               \
      dc01 = vis_to_double(c01, c02);                                      \
      dc02 = vis_to_double(c03, c01);                                      \
      dc03 = vis_to_double(c02, c03);                                      \
    } else {                                                               \
      c01 = (mlib_u32) c[0];                                               \
      c02 = (mlib_u32) c[1];                                               \
      c03 = (mlib_u32) c[2];                                               \
      c04 = (mlib_u32) c[3];                                               \
      dc01 = vis_to_double(c01, c02);                                      \
      dc02 = vis_to_double(c03, c04);                                      \
    }                                                                      \
  }                                                                        \
                                                                           \
  if ((width > stride) || (width > strided))                               \
    return MLIB_FAILURE

0N/A/***************************************************************/
0N/A
0N/Astatic mlib_status mlib_v_ImageConstLogic(mlib_image *dst,
0N/A mlib_image *src,
0N/A mlib_s32 *c)
0N/A{
0N/A mlib_s32 i, j;
0N/A mlib_s32 offdst, offsrc, emask;
0N/A mlib_d64 *dpp, *spp;
0N/A mlib_d64 sa1, sa2, da, sa;
0N/A mlib_d64 ssa, ssa1, ssa2, sa3, sa4;
0N/A mlib_s32 amount;
0N/A mlib_u8 *dend;
0N/A mlib_d64 c1, c2, c3;
0N/A
0N/A VALIDATE();
0N/A
0N/A if (nchannels == 3) {
0N/A if ((width == stride) && (width == strided) && ((width - (width / 3) * 3) == 0)) {
0N/A
0N/A amount = height * width;
0N/A dend = dp + amount - 1;
0N/A offdst = ((mlib_addr) dp) & 7;
0N/A offsrc = ((mlib_addr) sp) & 7;
0N/A
0N/A if (offsrc == offdst) {
0N/A
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c3 = vis_faligndata(dc03, dc01);
0N/A c1 = vis_faligndata(dc01, dc02);
0N/A c2 = vis_faligndata(dc02, dc03);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A c2 = dc02;
0N/A c3 = dc03;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, 0);
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c3, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 24; i += 24) {
0N/A dpp[0] = VIS_CONSTLOGIC(c1, spp[0]);
0N/A dpp[1] = VIS_CONSTLOGIC(c2, spp[1]);
0N/A dpp[2] = VIS_CONSTLOGIC(c3, spp[2]);
0N/A dpp += 3;
0N/A spp += 3;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c1, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c2, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c3, sa1);
0N/A vis_pst_8(da, dpp, emask);
0N/A }
0N/A }
0N/A else {
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c3 = vis_faligndata(dc03, dc01);
0N/A c1 = vis_faligndata(dc01, dc02);
0N/A c2 = vis_faligndata(dc02, dc03);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A c2 = dc02;
0N/A c3 = dc03;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, i);
0N/A
0N/A sa1 = spp[0];
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c3, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 24; i += 24) {
0N/A sa2 = spp[1];
0N/A ssa = vis_faligndata(sa1, sa2);
0N/A dpp[0] = VIS_CONSTLOGIC(c1, ssa);
0N/A sa3 = spp[2];
0N/A ssa1 = vis_faligndata(sa2, sa3);
0N/A dpp[1] = VIS_CONSTLOGIC(c2, ssa1);
0N/A sa4 = spp[3];
0N/A ssa2 = vis_faligndata(sa3, sa4);
0N/A dpp[2] = VIS_CONSTLOGIC(c3, ssa2);
0N/A sa1 = sa4;
0N/A dpp += 3;
0N/A spp += 3;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c1, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c2, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c3, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A }
0N/A }
0N/A }
0N/A else {
0N/A
0N/A sl = sp;
0N/A dl = dp;
0N/A
0N/A amount = width;
0N/A
0N/A for (j = 0; j < height; j++) {
0N/A
0N/A dend = dp + amount - 1;
0N/A offdst = ((mlib_addr) dp) & 7;
0N/A offsrc = ((mlib_addr) sp) & 7;
0N/A
0N/A if (offsrc == offdst) {
0N/A
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c3 = vis_faligndata(dc03, dc01);
0N/A c1 = vis_faligndata(dc01, dc02);
0N/A c2 = vis_faligndata(dc02, dc03);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A c2 = dc02;
0N/A c3 = dc03;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, 0);
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c3, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 24; i += 24) {
0N/A dpp[0] = VIS_CONSTLOGIC(c1, spp[0]);
0N/A dpp[1] = VIS_CONSTLOGIC(c2, spp[1]);
0N/A dpp[2] = VIS_CONSTLOGIC(c3, spp[2]);
0N/A dpp += 3;
0N/A spp += 3;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c1, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c2, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c3, sa1);
0N/A vis_pst_8(da, dpp, emask);
0N/A }
0N/A }
0N/A else {
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c3 = vis_faligndata(dc03, dc01);
0N/A c1 = vis_faligndata(dc01, dc02);
0N/A c2 = vis_faligndata(dc02, dc03);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A c2 = dc02;
0N/A c3 = dc03;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, i);
0N/A
0N/A sa1 = spp[0];
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c3, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 24; i += 24) {
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A dpp[0] = VIS_CONSTLOGIC(c1, sa);
0N/A sa1 = spp[2];
0N/A sa = vis_faligndata(sa2, sa1);
0N/A dpp[1] = VIS_CONSTLOGIC(c2, sa);
0N/A sa2 = spp[3];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A dpp[2] = VIS_CONSTLOGIC(c3, sa);
0N/A sa1 = sa2;
0N/A dpp += 3;
0N/A spp += 3;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c1, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c2, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c3, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A }
0N/A }
0N/A
0N/A sp = sl += stride;
0N/A dp = dl += strided;
0N/A }
0N/A }
0N/A
0N/A }
0N/A else if ((type != MLIB_INT) || (nchannels != 4)) {
0N/A
0N/A if ((width == stride) && (width == strided)) {
0N/A
0N/A amount = height * width;
0N/A dend = dp + amount - 1;
0N/A offdst = ((mlib_addr) dp) & 7;
0N/A offsrc = ((mlib_addr) sp) & 7;
0N/A
0N/A if (offsrc == offdst) {
0N/A
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c1 = vis_faligndata(dc01, dc01);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, 0);
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c1, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 8; i += 8) {
0N/A *dpp++ = VIS_CONSTLOGIC(c1, *spp);
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp;
0N/A da = VIS_CONSTLOGIC(c1, sa1);
0N/A vis_pst_8(da, dpp, emask);
0N/A }
0N/A }
0N/A else {
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c1 = vis_faligndata(dc01, dc01);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, i);
0N/A
0N/A sa1 = spp[0];
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c1, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 8; i += 8) {
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A *dpp++ = VIS_CONSTLOGIC(c1, sa);
0N/A sa1 = sa2;
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c1, sa);
0N/A vis_pst_8(da, dpp, emask);
0N/A }
0N/A }
0N/A }
0N/A else {
0N/A
0N/A sl = sp;
0N/A dl = dp;
0N/A
0N/A amount = width;
0N/A
0N/A for (j = 0; j < height; j++) {
0N/A
0N/A dend = dp + amount - 1;
0N/A offdst = ((mlib_addr) dp) & 7;
0N/A offsrc = ((mlib_addr) sp) & 7;
0N/A
0N/A if (offsrc == offdst) {
0N/A
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c1 = vis_faligndata(dc01, dc01);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, 0);
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c1, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 8; i += 8) {
0N/A *dpp++ = VIS_CONSTLOGIC(c1, *spp);
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp;
0N/A da = VIS_CONSTLOGIC(c1, sa1);
0N/A vis_pst_8(da, dpp, emask);
0N/A }
0N/A }
0N/A else {
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c1 = vis_faligndata(dc01, dc01);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, i);
0N/A
0N/A sa1 = spp[0];
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c1, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 8; i += 8) {
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A *dpp++ = VIS_CONSTLOGIC(c1, sa);
0N/A sa1 = sa2;
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c1, sa);
0N/A vis_pst_8(da, dpp, emask);
0N/A }
0N/A }
0N/A
0N/A sp = sl += stride;
0N/A dp = dl += strided;
0N/A }
0N/A }
0N/A
0N/A }
0N/A else {
0N/A
0N/A if ((width == stride) && (width == strided)) {
0N/A
0N/A amount = height * width;
0N/A dend = dp + amount - 1;
0N/A offdst = ((mlib_addr) dp) & 7;
0N/A offsrc = ((mlib_addr) sp) & 7;
0N/A
0N/A if (offsrc == offdst) {
0N/A
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c2 = vis_faligndata(dc02, dc01);
0N/A c1 = vis_faligndata(dc01, dc02);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A c2 = dc02;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, 0);
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c2, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 16; i += 16) {
0N/A dpp[0] = VIS_CONSTLOGIC(c1, spp[0]);
0N/A dpp[1] = VIS_CONSTLOGIC(c2, spp[1]);
0N/A dpp += 2;
0N/A spp += 2;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c1, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp;
0N/A da = VIS_CONSTLOGIC(c2, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A }
0N/A }
0N/A else {
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c2 = vis_faligndata(dc02, dc01);
0N/A c1 = vis_faligndata(dc01, dc02);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A c2 = dc02;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, i);
0N/A
0N/A sa1 = spp[0];
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c2, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 16; i += 16) {
0N/A sa2 = spp[1];
0N/A ssa = vis_faligndata(sa1, sa2);
0N/A dpp[0] = VIS_CONSTLOGIC(c1, ssa);
0N/A sa3 = spp[2];
0N/A ssa1 = vis_faligndata(sa2, sa3);
0N/A dpp[1] = VIS_CONSTLOGIC(c2, ssa1);
0N/A sa1 = sa3;
0N/A dpp += 2;
0N/A spp += 2;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c1, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c2, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A }
0N/A }
0N/A }
0N/A else {
0N/A
0N/A sl = sp;
0N/A dl = dp;
0N/A
0N/A amount = width;
0N/A
0N/A for (j = 0; j < height; j++) {
0N/A
0N/A dend = dp + amount - 1;
0N/A offdst = ((mlib_addr) dp) & 7;
0N/A offsrc = ((mlib_addr) sp) & 7;
0N/A
0N/A if (offsrc == offdst) {
0N/A
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c2 = vis_faligndata(dc02, dc01);
0N/A c1 = vis_faligndata(dc01, dc02);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A c2 = dc02;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, 0);
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c2, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 16; i += 16) {
0N/A dpp[0] = VIS_CONSTLOGIC(c1, spp[0]);
0N/A dpp[1] = VIS_CONSTLOGIC(c2, spp[1]);
0N/A dpp += 2;
0N/A spp += 2;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp++;
0N/A da = VIS_CONSTLOGIC(c1, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A i += 8;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa1 = *spp;
0N/A da = VIS_CONSTLOGIC(c2, sa1);
0N/A vis_pst_8(da, dpp++, emask);
0N/A }
0N/A }
0N/A else {
0N/A /* prepare the destination addresses */
0N/A dpp = (mlib_d64 *) vis_alignaddr(dp, 0);
0N/A i = (mlib_u8 *) dpp - dp;
0N/A
0N/A if (i != 0) {
0N/A vis_alignaddr((void *)(8 - offdst), 0);
0N/A c2 = vis_faligndata(dc02, dc01);
0N/A c1 = vis_faligndata(dc01, dc02);
0N/A }
0N/A else {
0N/A c1 = dc01;
0N/A c2 = dc02;
0N/A }
0N/A
0N/A /* prepare the destination addresses */
0N/A spp = (mlib_d64 *) vis_alignaddr(sp, i);
0N/A
0N/A sa1 = spp[0];
0N/A
0N/A if (i != 0) {
0N/A /* generate edge mask for the start point */
0N/A emask = vis_edge8(dp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c2, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A#pragma pipeloop(0)
0N/A for (; i < amount - 16; i += 16) {
0N/A sa2 = spp[1];
0N/A ssa = vis_faligndata(sa1, sa2);
0N/A dpp[0] = VIS_CONSTLOGIC(c1, ssa);
0N/A sa3 = spp[2];
0N/A ssa1 = vis_faligndata(sa2, sa3);
0N/A dpp[1] = VIS_CONSTLOGIC(c2, ssa1);
0N/A sa1 = sa3;
0N/A dpp += 2;
0N/A spp += 2;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c1, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A sa1 = sa2;
0N/A i += 8;
0N/A spp++;
0N/A }
0N/A
0N/A if (i < amount) {
0N/A emask = vis_edge8(dpp, dend);
0N/A sa2 = spp[1];
0N/A sa = vis_faligndata(sa1, sa2);
0N/A da = VIS_CONSTLOGIC(c2, sa);
0N/A vis_pst_8(da, dpp++, emask);
0N/A }
0N/A }
0N/A
0N/A sp = sl += stride;
0N/A dp = dl += strided;
0N/A }
0N/A }
0N/A }
0N/A
0N/A return MLIB_SUCCESS;
0N/A}
0N/A
0N/A/***************************************************************/
0N/A
0N/A#ifdef __cplusplus
0N/A}
0N/A#endif /* __cplusplus */
0N/A#endif /* __MLIB_V_IMAGECONSTLOGIC_H */