/* * Copyright (c) 2003, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. Oracle designates this * particular file as subject to the "Classpath" exception as provided * by Oracle in the LICENSE file that accompanied this code. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA * or visit www.oracle.com if you need additional information or have any * questions. */ #if !defined(JAVA2D_NO_MLIB) || defined(MLIB_ADD_SUFF) #include "vis_AlphaMacros.h" /***************************************************************/ #define Gray2RGBx(x) \ (x << 24) | (x << 16) | (x << 8) /***************************************************************/ #define READ_RGBx(i) \ (src[3*i + 2] << 24) | (src[3*i + 1] << 16) | (src[3*i] << 8) /***************************************************************/ void ADD_SUFF(IntRgbxToIntArgbConvert)(BLIT_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, mask; mlib_s32 i, i0, j; if (dstScan == 4*width && srcScan == 4*width) { width *= height; height = 1; } mask = vis_to_double_dup(0xFF000000); vis_alignaddr(NULL, 7); for (j = 0; j < height; j++) { mlib_u32 *src = srcBase; mlib_u32 *dst = dstBase; i = i0 = 0; if ((mlib_s32)dst & 7) { dst[i] = 0xff000000 | (src[i] >> 8); i0 = 1; } #pragma pipeloop(0) for (i = i0; i <= (mlib_s32)width - 2; i += 2) { dd = vis_freg_pair(((mlib_f32*)src)[i], ((mlib_f32*)src)[i + 1]); dd = vis_faligndata(dd, dd); *(mlib_d64*)(dst + i) = vis_for(dd, mask); } if (i < width) { dst[i] = 0xff000000 | (src[i] >> 8); } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(IntRgbxToIntArgbScaleConvert)(SCALE_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, mask; mlib_s32 j; mask = vis_to_double_dup(0xFF000000); vis_alignaddr(NULL, 7); for (j = 0; j < height; j++) { mlib_u32 *src = srcBase; mlib_u32 *dst = dstBase; mlib_u32 *dst_end = dst + width; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); if ((mlib_s32)dst & 7) { *dst++ = 0xff000000 | (src[tmpsxloc >> shift] >> 8); tmpsxloc += sxinc; } #pragma pipeloop(0) for (; dst <= dst_end - 2; dst += 2) { dd = vis_freg_pair(((mlib_f32*)src)[tmpsxloc >> shift], ((mlib_f32*)src)[(tmpsxloc + sxinc) >> shift]); dd = vis_faligndata(dd, dd); *(mlib_d64*)dst = vis_for(dd, mask); tmpsxloc += 2*sxinc; } for (; dst < dst_end; dst++) { *dst++ = 0xff000000 | (src[tmpsxloc >> shift] >> 8); tmpsxloc += sxinc; } PTR_ADD(dstBase, dstScan); syloc += syinc; } } /***************************************************************/ void ADD_SUFF(IntArgbToIntRgbxConvert)(BLIT_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, mask; mlib_s32 i, i0, j; if (dstScan == 4*width && srcScan == 4*width) { width *= height; height = 1; } mask = vis_to_double_dup(0xFFFFFF00); vis_alignaddr(NULL, 1); for (j = 0; j < height; j++) { mlib_u32 *src = srcBase; mlib_u32 *dst = dstBase; i = i0 = 0; if ((mlib_s32)dst & 7) { dst[i] = src[i] << 8; i0 = 1; } #pragma pipeloop(0) for (i = i0; i <= (mlib_s32)width - 2; i += 2) { dd = vis_freg_pair(((mlib_f32*)src)[i], ((mlib_f32*)src)[i + 1]); dd = vis_faligndata(dd, dd); *(mlib_d64*)(dst + i) = vis_fand(dd, mask); } if (i < width) { dst[i] = src[i] << 8; } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(IntArgbToIntRgbxScaleConvert)(SCALE_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, mask; mlib_s32 j; mask = vis_to_double_dup(0xFFFFFF00); vis_alignaddr(NULL, 1); for (j = 0; j < height; j++) { mlib_u32 *src = srcBase; mlib_u32 *dst = dstBase; mlib_u32 *dst_end = dst + width; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); if ((mlib_s32)dst & 7) { *dst++ = src[tmpsxloc >> shift] << 8; tmpsxloc += sxinc; } #pragma pipeloop(0) for (; dst <= dst_end - 2; dst += 2) { dd = vis_freg_pair(((mlib_f32*)src)[tmpsxloc >> shift], ((mlib_f32*)src)[(tmpsxloc + sxinc) >> shift]); dd = vis_faligndata(dd, dd); *(mlib_d64*)dst = vis_fand(dd, mask); tmpsxloc += 2*sxinc; } for (; dst < dst_end; dst++) { *dst++ = src[tmpsxloc >> shift] << 8; tmpsxloc += sxinc; } PTR_ADD(dstBase, dstScan); syloc += syinc; } } /***************************************************************/ #define BGR_TO_RGBx { \ mlib_d64 sda, sdb, sdc, sdd, sde, sdf; \ mlib_d64 a13, b13, a02, b02; \ \ sda = vis_fpmerge(vis_read_hi(sd0), vis_read_lo(sd1)); \ sdb = vis_fpmerge(vis_read_lo(sd0), vis_read_hi(sd2)); \ sdc = vis_fpmerge(vis_read_hi(sd1), vis_read_lo(sd2)); \ \ sdd = vis_fpmerge(vis_read_hi(sda), vis_read_lo(sdb)); \ sde = vis_fpmerge(vis_read_lo(sda), vis_read_hi(sdc)); \ sdf = vis_fpmerge(vis_read_hi(sdb), vis_read_lo(sdc)); \ \ s_2 = vis_fpmerge(vis_read_hi(sdd), vis_read_lo(sde)); \ s_1 = vis_fpmerge(vis_read_lo(sdd), vis_read_hi(sdf)); \ s_0 = vis_fpmerge(vis_read_hi(sde), vis_read_lo(sdf)); \ \ a13 = vis_fpmerge(vis_read_hi(s_1), vis_read_hi(s_3)); \ b13 = vis_fpmerge(vis_read_lo(s_1), vis_read_lo(s_3)); \ a02 = vis_fpmerge(vis_read_hi(s_0), vis_read_hi(s_2)); \ b02 = vis_fpmerge(vis_read_lo(s_0), vis_read_lo(s_2)); \ \ dd0 = vis_fpmerge(vis_read_hi(a02), vis_read_hi(a13)); \ dd1 = vis_fpmerge(vis_read_lo(a02), vis_read_lo(a13)); \ dd2 = vis_fpmerge(vis_read_hi(b02), vis_read_hi(b13)); \ dd3 = vis_fpmerge(vis_read_lo(b02), vis_read_lo(b13)); \ } /***************************************************************/ void ADD_SUFF(ThreeByteBgrToIntRgbxConvert)(BLIT_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 *sp; mlib_d64 s_0, s_1, s_2, s_3; mlib_d64 s0, s1, s2, s3, sd0, sd1, sd2, dd0, dd1, dd2, dd3; mlib_s32 i, i0, j; if (width < 16) { for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_u32 *dst = dstBase; for (i = 0; i < width; i++) { dst[i] = READ_RGBx(i); } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } return; } if (srcScan == 3*width && dstScan == 4*width) { width *= height; height = 1; } s_3 = vis_fzero(); for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_f32 *dst = dstBase; i = i0 = 0; if ((mlib_s32)dst & 7) { ((mlib_s32*)dst)[i] = READ_RGBx(i); i0 = 1; } sp = vis_alignaddr(src, 3*i0); s3 = *sp++; #pragma pipeloop(0) for (i = i0; i <= (mlib_s32)width - 8; i += 8) { s0 = s3; s1 = *sp++; s2 = *sp++; s3 = *sp++; sd0 = vis_faligndata(s0, s1); sd1 = vis_faligndata(s1, s2); sd2 = vis_faligndata(s2, s3); BGR_TO_RGBx *(mlib_d64*)(dst + i ) = dd0; *(mlib_d64*)(dst + i + 2) = dd1; *(mlib_d64*)(dst + i + 4) = dd2; *(mlib_d64*)(dst + i + 6) = dd3; } for (; i < width; i++) { ((mlib_s32*)dst)[i] = READ_RGBx(i); } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(ThreeByteBgrToIntRgbxScaleConvert)(SCALE_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, dzero; mlib_s32 i, i0, i1, j; if (width < 16) { for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; mlib_s32 *dst_end = dst + width; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); for (; dst < dst_end; dst++) { i = tmpsxloc >> shift; tmpsxloc += sxinc; *(mlib_s32*)dst = READ_RGBx(i); } PTR_ADD(dstBase, dstScan); syloc += syinc; } return; } dzero = vis_fzero(); vis_alignaddr(NULL, 7); for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_f32 *dst = dstBase; mlib_f32 *dst_end = dst + width; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); if ((mlib_s32)dst & 7) { i = tmpsxloc >> shift; tmpsxloc += sxinc; *(mlib_s32*)dst = READ_RGBx(i); dst++; } #pragma pipeloop(0) for (; dst <= dst_end - 2; dst += 2) { i0 = tmpsxloc >> shift; i1 = (tmpsxloc + sxinc) >> shift; tmpsxloc += 2*sxinc; dd = vis_faligndata(vis_ld_u8(src + 3*i1 ), dzero); dd = vis_faligndata(vis_ld_u8(src + 3*i1 + 1), dd); dd = vis_faligndata(vis_ld_u8(src + 3*i1 + 2), dd); dd = vis_faligndata(dzero, dd); dd = vis_faligndata(vis_ld_u8(src + 3*i0 ), dd); dd = vis_faligndata(vis_ld_u8(src + 3*i0 + 1), dd); dd = vis_faligndata(vis_ld_u8(src + 3*i0 + 2), dd); *(mlib_d64*)dst = dd; } for (; dst < dst_end; dst++) { i = tmpsxloc >> shift; tmpsxloc += sxinc; *(mlib_s32*)dst = READ_RGBx(i); } PTR_ADD(dstBase, dstScan); syloc += syinc; } } /***************************************************************/ void ADD_SUFF(ByteGrayToIntRgbxConvert)(BLIT_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 d0, d1, d2, d3; mlib_f32 ff, aa = vis_fzero(); mlib_s32 i, j, x; if (width < 8) { for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; for (i = 0; i < width; i++) { x = src[i]; dst[i] = Gray2RGBx(x); } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } return; } if (srcScan == width && dstScan == 4*width) { width *= height; height = 1; } for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; mlib_s32 *dst_end; dst_end = dst + width; while (((mlib_s32)src & 3) && dst < dst_end) { x = *src++; *dst++ = Gray2RGBx(x); } #pragma pipeloop(0) for (; dst <= (dst_end - 4); dst += 4) { ff = *(mlib_f32*)src; d0 = vis_fpmerge(ff, ff); d1 = vis_fpmerge(ff, aa); d2 = vis_fpmerge(vis_read_hi(d0), vis_read_hi(d1)); d3 = vis_fpmerge(vis_read_lo(d0), vis_read_lo(d1)); ((mlib_f32*)dst)[0] = vis_read_hi(d2); ((mlib_f32*)dst)[1] = vis_read_lo(d2); ((mlib_f32*)dst)[2] = vis_read_hi(d3); ((mlib_f32*)dst)[3] = vis_read_lo(d3); src += 4; } while (dst < dst_end) { x = *src++; *dst++ = Gray2RGBx(x); } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(ByteGrayToIntRgbxScaleConvert)(SCALE_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 d0, d1, d2, d3, dd; mlib_f32 ff, aa = vis_fzero(); mlib_s32 i, j, x; if (width < 16) { for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); for (i = 0; i < width; i++) { x = src[tmpsxloc >> shift]; tmpsxloc += sxinc; dst[i] = Gray2RGBx(x); } PTR_ADD(dstBase, dstScan); syloc += syinc; } return; } vis_alignaddr(NULL, 7); for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; mlib_s32 *dst_end; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); dst_end = dst + width; #pragma pipeloop(0) for (; dst <= (dst_end - 4); dst += 4) { LOAD_NEXT_U8(dd, src + ((tmpsxloc + 3*sxinc) >> shift)); LOAD_NEXT_U8(dd, src + ((tmpsxloc + 2*sxinc) >> shift)); LOAD_NEXT_U8(dd, src + ((tmpsxloc + sxinc) >> shift)); LOAD_NEXT_U8(dd, src + ((tmpsxloc ) >> shift)); tmpsxloc += 4*sxinc; ff = vis_read_hi(dd); d0 = vis_fpmerge(ff, ff); d1 = vis_fpmerge(ff, aa); d2 = vis_fpmerge(vis_read_hi(d0), vis_read_hi(d1)); d3 = vis_fpmerge(vis_read_lo(d0), vis_read_lo(d1)); ((mlib_f32*)dst)[0] = vis_read_hi(d2); ((mlib_f32*)dst)[1] = vis_read_lo(d2); ((mlib_f32*)dst)[2] = vis_read_hi(d3); ((mlib_f32*)dst)[3] = vis_read_lo(d3); } while (dst < dst_end) { x = src[tmpsxloc >> shift]; tmpsxloc += sxinc; *dst++ = Gray2RGBx(x); } PTR_ADD(dstBase, dstScan); syloc += syinc; } } /***************************************************************/ void ADD_SUFF(IntArgbBmToIntRgbxXparOver)(BLIT_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, maskRGBx; mlib_s32 i, i0, j, mask; if (dstScan == 4*width && srcScan == 4*width) { width *= height; height = 1; } vis_alignaddr(NULL, 1); maskRGBx = vis_to_double_dup(0xFFFFFF00); for (j = 0; j < height; j++) { mlib_s32 *src = srcBase; mlib_s32 *dst = dstBase; i = i0 = 0; if ((mlib_s32)dst & 7) { if (*(mlib_u8*)(src + i)) { dst[i] = src[i] << 8; } i0 = 1; } #pragma pipeloop(0) for (i = i0; i <= (mlib_s32)width - 2; i += 2) { dd = vis_freg_pair(((mlib_s32*)src)[i], ((mlib_s32*)src)[i + 1]); dd = vis_fand(vis_faligndata(dd, dd), maskRGBx); mask = (((-*(mlib_u8*)(src + i)) >> 31) & 2) | (((-*(mlib_u8*)(src + i + 1)) >> 31) & 1); vis_pst_32(dd, dst + i, mask); } if (i < width) { if (*(mlib_u8*)(src + i)) { dst[i] = src[i] << 8; } } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(IntArgbBmToIntRgbxScaleXparOver)(SCALE_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, maskRGBx; mlib_s32 j, mask; vis_alignaddr(NULL, 1); maskRGBx = vis_to_double_dup(0xFFFFFF00); for (j = 0; j < height; j++) { mlib_s32 *src = srcBase; mlib_s32 *dst = dstBase; mlib_s32 *dst_end = dst + width; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); if ((mlib_s32)dst & 7) { mlib_s32 *pp = src + (tmpsxloc >> shift); if (*(mlib_u8*)pp) { *dst = *pp << 8; } dst++; tmpsxloc += sxinc; } #pragma pipeloop(0) for (; dst <= dst_end - 2; dst += 2) { mlib_s32 *pp0 = src + (tmpsxloc >> shift); mlib_s32 *pp1 = src + ((tmpsxloc + sxinc) >> shift); dd = vis_freg_pair(*(mlib_f32*)pp0, *(mlib_f32*)pp1); dd = vis_fand(vis_faligndata(dd, dd), maskRGBx); mask = (((-*(mlib_u8*)pp0) >> 31) & 2) | ((mlib_u32)(-*(mlib_u8*)pp1) >> 31); vis_pst_32(dd, dst, mask); tmpsxloc += 2*sxinc; } for (; dst < dst_end; dst++) { mlib_s32 *pp = src + (tmpsxloc >> shift); if (*(mlib_u8*)pp) { *dst = *pp << 8; } } PTR_ADD(dstBase, dstScan); syloc += syinc; } } /***************************************************************/ void ADD_SUFF(IntArgbBmToIntRgbxXparBgCopy)(BCOPY_PARAMS) { mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, d_bgpixel, maskRGBx; mlib_s32 i, i0, j, mask; if (dstScan == 4*width && srcScan == 4*width) { width *= height; height = 1; } vis_alignaddr(NULL, 1); d_bgpixel = vis_to_double_dup(bgpixel); maskRGBx = vis_to_double_dup(0xFFFFFF00); for (j = 0; j < height; j++) { mlib_s32 *src = srcBase; mlib_s32 *dst = dstBase; i = i0 = 0; if ((mlib_s32)dst & 7) { if (*(mlib_u8*)(src + i)) { dst[i] = src[i] << 8; } else { dst[i] = bgpixel; } i0 = 1; } #pragma pipeloop(0) for (i = i0; i <= (mlib_s32)width - 2; i += 2) { dd = vis_freg_pair(((mlib_s32*)src)[i], ((mlib_s32*)src)[i + 1]); dd = vis_fand(vis_faligndata(dd, dd), maskRGBx); mask = (((-*(mlib_u8*)(src + i)) >> 31) & 2) | (((-*(mlib_u8*)(src + i + 1)) >> 31) & 1); *(mlib_d64*)(dst + i) = d_bgpixel; vis_pst_32(dd, dst + i, mask); } if (i < width) { if (*(mlib_u8*)(src + i)) { dst[i] = src[i] << 8; } else { dst[i] = bgpixel; } } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(ByteIndexedToIntRgbxConvert)(BLIT_PARAMS) { jint *pixLut = pSrcInfo->lutBase; mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, maskRGBx; mlib_s32 i, i0, j; if (srcScan == width && dstScan == 4*width) { width *= height; height = 1; } vis_alignaddr(NULL, 1); maskRGBx = vis_to_double_dup(0xFFFFFF00); for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; i = i0 = 0; if ((mlib_s32)dst & 7) { dst[i] = pixLut[src[i]] << 8; i0 = 1; } #pragma pipeloop(0) for (i = i0; i <= (mlib_s32)width - 2; i += 2) { dd = vis_freg_pair(((mlib_f32*)pixLut)[src[i]], ((mlib_f32*)pixLut)[src[i + 1]]); dd = vis_fand(vis_faligndata(dd, dd), maskRGBx); *(mlib_d64*)(dst + i) = dd; } for (; i < width; i++) { dst[i] = pixLut[src[i]] << 8; } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(ByteIndexedToIntRgbxScaleConvert)(SCALE_PARAMS) { jint *pixLut = pSrcInfo->lutBase; mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, maskRGBx; mlib_s32 j; vis_alignaddr(NULL, 1); maskRGBx = vis_to_double_dup(0xFFFFFF00); for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; mlib_s32 *dst_end = dst + width; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); if ((mlib_s32)dst & 7) { *dst++ = pixLut[src[tmpsxloc >> shift]] << 8; tmpsxloc += sxinc; } #pragma pipeloop(0) for (; dst <= dst_end - 2; dst += 2) { dd = LOAD_2F32(pixLut, src[tmpsxloc >> shift], src[(tmpsxloc + sxinc) >> shift]); dd = vis_fand(vis_faligndata(dd, dd), maskRGBx); *(mlib_d64*)dst = dd; tmpsxloc += 2*sxinc; } for (; dst < dst_end; dst++) { *dst = pixLut[src[tmpsxloc >> shift]] << 8; tmpsxloc += sxinc; } PTR_ADD(dstBase, dstScan); syloc += syinc; } } /***************************************************************/ void ADD_SUFF(ByteIndexedBmToIntRgbxXparOver)(BLIT_PARAMS) { jint *pixLut = pSrcInfo->lutBase; mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, maskRGBx; mlib_s32 i, i0, j, x, mask; if (srcScan == width && dstScan == 4*width) { width *= height; height = 1; } vis_alignaddr(NULL, 1); maskRGBx = vis_to_double_dup(0xFFFFFF00); for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; i = i0 = 0; if ((mlib_s32)dst & 7) { x = pixLut[src[i]]; if (x < 0) { dst[i] = x << 8; } i0 = 1; } #pragma pipeloop(0) for (i = i0; i <= (mlib_s32)width - 2; i += 2) { mlib_f32 *pp0 = (mlib_f32*)pixLut + src[i]; mlib_f32 *pp1 = (mlib_f32*)pixLut + src[i + 1]; dd = vis_freg_pair(*pp0, *pp1); mask = (((*(mlib_u8*)pp0) >> 6) & 2) | ((*(mlib_u8*)pp1) >> 7); dd = vis_fand(vis_faligndata(dd, dd), maskRGBx); vis_pst_32(dd, dst + i, mask); } for (; i < width; i++) { x = pixLut[src[i]]; if (x < 0) { dst[i] = x << 8; } } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(ByteIndexedBmToIntRgbxScaleXparOver)(SCALE_PARAMS) { jint *pixLut = pSrcInfo->lutBase; mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, maskRGBx; mlib_s32 j, x, mask; vis_alignaddr(NULL, 1); maskRGBx = vis_to_double_dup(0xFFFFFF00); for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; mlib_s32 *dst_end = dst + width; mlib_s32 tmpsxloc = sxloc; PTR_ADD(src, (syloc >> shift) * srcScan); if ((mlib_s32)dst & 7) { x = pixLut[src[tmpsxloc >> shift]]; tmpsxloc += sxinc; if (x < 0) { *dst = x << 8; } dst++; } #pragma pipeloop(0) for (; dst <= dst_end - 2; dst += 2) { mlib_f32 *p0 = (mlib_f32*)pixLut + src[tmpsxloc >> shift]; mlib_f32 *p1 = (mlib_f32*)pixLut + src[(tmpsxloc + sxinc) >> shift]; dd = vis_freg_pair(*p0, *p1); mask = (((*(mlib_u8*)p0) >> 6) & 2) | ((*(mlib_u8*)p1) >> 7); dd = vis_fand(vis_faligndata(dd, dd), maskRGBx); tmpsxloc += 2*sxinc; vis_pst_32(dd, dst, mask); } for (; dst < dst_end; dst++) { x = pixLut[src[tmpsxloc >> shift]]; tmpsxloc += sxinc; if (x < 0) { *dst = x << 8; } } PTR_ADD(dstBase, dstScan); syloc += syinc; } } /***************************************************************/ void ADD_SUFF(ByteIndexedBmToIntRgbxXparBgCopy)(BCOPY_PARAMS) { jint *pixLut = pSrcInfo->lutBase; mlib_s32 dstScan = pDstInfo->scanStride; mlib_s32 srcScan = pSrcInfo->scanStride; mlib_d64 dd, d_bgpixel, maskRGBx; mlib_s32 j, x, mask; if (srcScan == width && dstScan == 4*width) { width *= height; height = 1; } vis_alignaddr(NULL, 1); maskRGBx = vis_to_double_dup(0xFFFFFF00); d_bgpixel = vis_to_double_dup(bgpixel); for (j = 0; j < height; j++) { mlib_u8 *src = srcBase; mlib_s32 *dst = dstBase; mlib_s32 *dst_end; dst_end = dst + width; if ((mlib_s32)dst & 7) { x = pixLut[*src++]; if (x < 0) { *dst = x << 8; } else { *dst = bgpixel; } dst++; } #pragma pipeloop(0) for (; dst <= (dst_end - 2); dst += 2) { mlib_f32 *pp0 = (mlib_f32*)pixLut + src[0]; mlib_f32 *pp1 = (mlib_f32*)pixLut + src[1]; dd = vis_freg_pair(*pp0, *pp1); mask = (((*(mlib_u8*)pp0) >> 6) & 2) | ((*(mlib_u8*)pp1) >> 7); dd = vis_fand(vis_faligndata(dd, dd), maskRGBx); *(mlib_d64*)dst = d_bgpixel; vis_pst_32(dd, dst, mask); src += 2; } while (dst < dst_end) { x = pixLut[*src++]; if (x < 0) { *dst = x << 8; } else { *dst = bgpixel; } dst++; } PTR_ADD(dstBase, dstScan); PTR_ADD(srcBase, srcScan); } } /***************************************************************/ void ADD_SUFF(IntRgbxDrawGlyphListAA)(GLYPH_LIST_PARAMS) { mlib_s32 glyphCounter; mlib_s32 scan = pRasInfo->scanStride; mlib_u8 *dstBase; mlib_s32 j; mlib_d64 dmix0, dmix1, dd, d0, d1, e0, e1, fgpixel_d; mlib_d64 done, done16, d_half, maskRGB, dzero; mlib_s32 pix, mask, mask_z; mlib_f32 srcG_f; done = vis_to_double_dup(0x7fff7fff); done16 = vis_to_double_dup(0x7fff); d_half = vis_to_double_dup((1 << (16 + 6)) | (1 << 6)); fgpixel_d = vis_to_double_dup(fgpixel); srcG_f = vis_to_float(argbcolor << 8); maskRGB = vis_to_double_dup(0xffffff00); dzero = vis_fzero(); vis_write_gsr(0 << 3); for (glyphCounter = 0; glyphCounter < totalGlyphs; glyphCounter++) { const jubyte *pixels; unsigned int rowBytes; int left, top; int width, height; int right, bottom; pixels = (const jubyte *) glyphs[glyphCounter].pixels; if (!pixels) continue; left = glyphs[glyphCounter].x; top = glyphs[glyphCounter].y; width = glyphs[glyphCounter].width; height = glyphs[glyphCounter].height; rowBytes = width; right = left + width; bottom = top + height; if (left < clipLeft) { pixels += clipLeft - left; left = clipLeft; } if (top < clipTop) { pixels += (clipTop - top) * rowBytes; top = clipTop; } if (right > clipRight) { right = clipRight; } if (bottom > clipBottom) { bottom = clipBottom; } if (right <= left || bottom <= top) { continue; } width = right - left; height = bottom - top; dstBase = pRasInfo->rasBase; PTR_ADD(dstBase, top*scan + 4*left); for (j = 0; j < height; j++) { mlib_u8 *src = (void*)pixels; mlib_s32 *dst, *dst_end; dst = (void*)dstBase; dst_end = dst + width; if ((mlib_s32)dst & 7) { pix = *src++; if (pix) { dd = vis_fpadd16(MUL8_VIS(srcG_f, pix), d_half); dd = vis_fpadd16(MUL8_VIS(*(mlib_f32*)dst, 255 - pix), dd); *(mlib_f32*)dst = vis_fands(vis_fpack16(dd), vis_read_hi(maskRGB)); if (pix == 255) *(mlib_f32*)dst = vis_read_hi(fgpixel_d); } dst++; } #pragma pipeloop(0) for (; dst <= (dst_end - 2); dst += 2) { dmix0 = vis_freg_pair(((mlib_f32 *)vis_mul8s_tbl)[src[0]], ((mlib_f32 *)vis_mul8s_tbl)[src[1]]); mask = vis_fcmplt32(dmix0, done16); mask_z = vis_fcmpne32(dmix0, dzero); dmix1 = vis_fpsub16(done, dmix0); src += 2; dd = *(mlib_d64*)dst; d0 = vis_fmul8x16al(srcG_f, vis_read_hi(dmix0)); d1 = vis_fmul8x16al(srcG_f, vis_read_lo(dmix0)); e0 = vis_fmul8x16al(vis_read_hi(dd), vis_read_hi(dmix1)); e1 = vis_fmul8x16al(vis_read_lo(dd), vis_read_lo(dmix1)); d0 = vis_fpadd16(vis_fpadd16(d0, d_half), e0); d1 = vis_fpadd16(vis_fpadd16(d1, d_half), e1); dd = vis_fpack16_pair(d0, d1); dd = vis_fand(dd, maskRGB); vis_pst_32(fgpixel_d, dst, mask_z); vis_pst_32(dd, dst, mask & mask_z); } while (dst < dst_end) { pix = *src++; if (pix) { dd = vis_fpadd16(MUL8_VIS(srcG_f, pix), d_half); dd = vis_fpadd16(MUL8_VIS(*(mlib_f32*)dst, 255 - pix), dd); *(mlib_f32*)dst = vis_fands(vis_fpack16(dd), vis_read_hi(maskRGB)); if (pix == 255) *(mlib_f32*)dst = vis_read_hi(fgpixel_d); } dst++; } PTR_ADD(dstBase, scan); pixels += rowBytes; } } } /***************************************************************/ #endif /* JAVA2D_NO_MLIB */