Path: blob/aarch64-shenandoah-jdk8u272-b10/jdk/src/solaris/native/sun/java2d/loops/vis_IntBgr.c
32288 views
/*1* Copyright (c) 2003, Oracle and/or its affiliates. All rights reserved.2* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.3*4* This code is free software; you can redistribute it and/or modify it5* under the terms of the GNU General Public License version 2 only, as6* published by the Free Software Foundation. Oracle designates this7* particular file as subject to the "Classpath" exception as provided8* by Oracle in the LICENSE file that accompanied this code.9*10* This code is distributed in the hope that it will be useful, but WITHOUT11* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or12* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License13* version 2 for more details (a copy is included in the LICENSE file that14* accompanied this code).15*16* You should have received a copy of the GNU General Public License version17* 2 along with this work; if not, write to the Free Software Foundation,18* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.19*20* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA21* or visit www.oracle.com if you need additional information or have any22* questions.23*/2425#if !defined(JAVA2D_NO_MLIB) || defined(MLIB_ADD_SUFF)2627#include "vis_AlphaMacros.h"2829/***************************************************************/3031#define ARGB_to_GBGR(x) \32(x << 16) | (x & 0xff00) | ((x >> 16) & 0xff)3334/***************************************************************/3536#define ARGB_to_BGR(x) \37((x << 16) & 0xff0000) | (x & 0xff00) | ((x >> 16) & 0xff)3839/***************************************************************/4041#define READ_Bgr(i) \42(src[3*i] << 16) | (src[3*i + 1] << 8) | src[3*i + 2]4344/***************************************************************/4546#define ARGB_to_GBGR_FL2(dst, src0, src1) { \47mlib_d64 t0, t1, t2; \48t0 = vis_fpmerge(src0, src1); \49t1 = vis_fpmerge(vis_read_lo(t0), vis_read_hi(t0)); \50t2 = vis_fpmerge(vis_read_lo(t0), vis_read_lo(t0)); \51dst = vis_fpmerge(vis_read_hi(t2), vis_read_lo(t1)); \52}5354/***************************************************************/5556#define ARGB_to_BGR_FL2(dst, src0, src1) { \57mlib_d64 t0, t1, t2; \58t0 = vis_fpmerge(src0, src1); \59t1 = vis_fpmerge(vis_read_lo(t0), vis_read_hi(t0)); \60t2 = vis_fpmerge(vis_fzeros(), vis_read_lo(t0)); \61dst = vis_fpmerge(vis_read_hi(t2), vis_read_lo(t1)); \62}6364/***************************************************************/6566void ADD_SUFF(IntBgrToIntArgbConvert)(BLIT_PARAMS)67{68mlib_s32 dstScan = pDstInfo->scanStride;69mlib_s32 srcScan = pSrcInfo->scanStride;70mlib_d64 dd, amask;71mlib_s32 i, i0, j, x;7273if (dstScan == 4*width && srcScan == 4*width) {74width *= height;75height = 1;76}7778amask = vis_to_double_dup(0xFF000000);79vis_alignaddr(NULL, 7);8081for (j = 0; j < height; j++) {82mlib_u32 *src = srcBase;83mlib_u32 *dst = dstBase;8485i = i0 = 0;8687if ((mlib_s32)dst & 7) {88x = src[i];89dst[i] = 0xff000000 | ARGB_to_GBGR(x);90i0 = 1;91}9293#pragma pipeloop(0)94for (i = i0; i <= (mlib_s32)width - 2; i += 2) {95ARGB2ABGR_FL2(dd, ((mlib_f32*)src)[i], ((mlib_f32*)src)[i + 1]);96*(mlib_d64*)(dst + i) = vis_for(dd, amask);97}9899if (i < width) {100x = src[i];101dst[i] = 0xff000000 | ARGB_to_GBGR(x);102}103104PTR_ADD(dstBase, dstScan);105PTR_ADD(srcBase, srcScan);106}107}108109/***************************************************************/110111void ADD_SUFF(IntBgrToIntArgbScaleConvert)(SCALE_PARAMS)112{113mlib_s32 dstScan = pDstInfo->scanStride;114mlib_s32 srcScan = pSrcInfo->scanStride;115mlib_d64 dd, amask;116mlib_s32 j, x;117118amask = vis_to_double_dup(0xFF000000);119vis_alignaddr(NULL, 7);120121for (j = 0; j < height; j++) {122mlib_u32 *src = srcBase;123mlib_u32 *dst = dstBase;124mlib_u32 *dst_end = dst + width;125mlib_s32 tmpsxloc = sxloc;126127PTR_ADD(src, (syloc >> shift) * srcScan);128129if ((mlib_s32)dst & 7) {130x = src[tmpsxloc >> shift];131*dst++ = 0xff000000 | ARGB_to_GBGR(x);132tmpsxloc += sxinc;133}134135#pragma pipeloop(0)136for (; dst <= dst_end - 2; dst += 2) {137ARGB2ABGR_FL2(dd, ((mlib_f32*)src)[tmpsxloc >> shift],138((mlib_f32*)src)[(tmpsxloc + sxinc) >> shift]);139*(mlib_d64*)dst = vis_for(dd, amask);140tmpsxloc += 2*sxinc;141}142143for (; dst < dst_end; dst++) {144x = src[tmpsxloc >> shift];145*dst++ = 0xff000000 | ARGB_to_GBGR(x);146tmpsxloc += sxinc;147}148149PTR_ADD(dstBase, dstScan);150syloc += syinc;151}152}153154/***************************************************************/155156void ADD_SUFF(IntArgbToIntBgrConvert)(BLIT_PARAMS)157{158mlib_s32 dstScan = pDstInfo->scanStride;159mlib_s32 srcScan = pSrcInfo->scanStride;160mlib_d64 dd;161mlib_s32 i, i0, j, x;162163if (dstScan == 4*width && srcScan == 4*width) {164width *= height;165height = 1;166}167168for (j = 0; j < height; j++) {169mlib_u32 *src = srcBase;170mlib_u32 *dst = dstBase;171172i = i0 = 0;173174if ((mlib_s32)dst & 7) {175x = src[i];176dst[i] = ARGB_to_GBGR(x);177i0 = 1;178}179180#pragma pipeloop(0)181for (i = i0; i <= (mlib_s32)width - 2; i += 2) {182ARGB_to_GBGR_FL2(dd, ((mlib_f32*)src)[i], ((mlib_f32*)src)[i + 1]);183*(mlib_d64*)(dst + i) = dd;184}185186if (i < width) {187x = src[i];188dst[i] = ARGB_to_GBGR(x);189}190191PTR_ADD(dstBase, dstScan);192PTR_ADD(srcBase, srcScan);193}194}195196/***************************************************************/197198void ADD_SUFF(IntArgbToIntBgrScaleConvert)(SCALE_PARAMS)199{200mlib_s32 dstScan = pDstInfo->scanStride;201mlib_s32 srcScan = pSrcInfo->scanStride;202mlib_d64 dd;203mlib_s32 j, x;204205for (j = 0; j < height; j++) {206mlib_u32 *src = srcBase;207mlib_u32 *dst = dstBase;208mlib_u32 *dst_end = dst + width;209mlib_s32 tmpsxloc = sxloc;210211PTR_ADD(src, (syloc >> shift) * srcScan);212213if ((mlib_s32)dst & 7) {214x = src[tmpsxloc >> shift];215*dst++ = ARGB_to_GBGR(x);216tmpsxloc += sxinc;217}218219#pragma pipeloop(0)220for (; dst <= dst_end - 2; dst += 2) {221ARGB_to_GBGR_FL2(dd, ((mlib_f32*)src)[tmpsxloc >> shift],222((mlib_f32*)src)[(tmpsxloc + sxinc) >> shift]);223*(mlib_d64*)dst = dd;224tmpsxloc += 2*sxinc;225}226227for (; dst < dst_end; dst++) {228x = src[tmpsxloc >> shift];229*dst++ = ARGB_to_GBGR(x);230tmpsxloc += sxinc;231}232233PTR_ADD(dstBase, dstScan);234syloc += syinc;235}236}237238/***************************************************************/239240#define INSERT_U8_34R { \241mlib_d64 sda, sdb, sdc, sdd; \242mlib_d64 sde, sdf, sdg, sdh; \243mlib_d64 sdi, sdj, sdk, sdl; \244mlib_d64 sdm; \245\246sda = vis_fpmerge(vis_read_hi(sd0), vis_read_lo(sd1)); \247sdb = vis_fpmerge(vis_read_lo(sd0), vis_read_hi(sd2)); \248sdc = vis_fpmerge(vis_read_hi(sd1), vis_read_lo(sd2)); \249sdd = vis_fpmerge(vis_read_hi(sda), vis_read_lo(sdb)); \250sde = vis_fpmerge(vis_read_lo(sda), vis_read_hi(sdc)); \251sdf = vis_fpmerge(vis_read_hi(sdb), vis_read_lo(sdc)); \252sdg = vis_fpmerge(vis_read_hi(sdd), vis_read_lo(sde)); \253sdh = vis_fpmerge(vis_read_lo(sdd), vis_read_hi(sdf)); \254sdi = vis_fpmerge(vis_read_hi(sde), vis_read_lo(sdf)); \255sdj = vis_fpmerge(vis_read_hi(sdg), vis_read_hi(sdi)); \256sdk = vis_fpmerge(vis_read_lo(sdg), vis_read_lo(sdi)); \257sdl = vis_fpmerge(vis_read_hi(sFF), vis_read_hi(sdh)); \258sdm = vis_fpmerge(vis_read_lo(sFF), vis_read_lo(sdh)); \259dd0 = vis_fpmerge(vis_read_hi(sdl), vis_read_hi(sdj)); \260dd1 = vis_fpmerge(vis_read_lo(sdl), vis_read_lo(sdj)); \261dd2 = vis_fpmerge(vis_read_hi(sdm), vis_read_hi(sdk)); \262dd3 = vis_fpmerge(vis_read_lo(sdm), vis_read_lo(sdk)); \263}264265/***************************************************************/266267void ADD_SUFF(ThreeByteBgrToIntBgrConvert)(BLIT_PARAMS)268{269mlib_s32 dstScan = pDstInfo->scanStride;270mlib_s32 srcScan = pSrcInfo->scanStride;271mlib_d64 *sp;272mlib_d64 sFF;273mlib_d64 s0, s1, s2, s3, sd0, sd1, sd2, dd0, dd1, dd2, dd3;274mlib_s32 i, i0, j;275276if (width < 16) {277for (j = 0; j < height; j++) {278mlib_u8 *src = srcBase;279mlib_u32 *dst = dstBase;280281for (i = 0; i < width; i++) {282dst[i] = READ_Bgr(i);283}284285PTR_ADD(dstBase, dstScan);286PTR_ADD(srcBase, srcScan);287}288return;289}290291if (srcScan == 3*width && dstScan == 4*width) {292width *= height;293height = 1;294}295296sFF = vis_fzero();297298for (j = 0; j < height; j++) {299mlib_u8 *src = srcBase;300mlib_f32 *dst = dstBase;301302i = i0 = 0;303304if ((mlib_s32)dst & 7) {305((mlib_s32*)dst)[i] = READ_Bgr(i);306i0 = 1;307}308309sp = vis_alignaddr(src, 3*i0);310s3 = *sp++;311312#pragma pipeloop(0)313for (i = i0; i <= (mlib_s32)width - 8; i += 8) {314s0 = s3;315s1 = *sp++;316s2 = *sp++;317s3 = *sp++;318sd0 = vis_faligndata(s0, s1);319sd1 = vis_faligndata(s1, s2);320sd2 = vis_faligndata(s2, s3);321322INSERT_U8_34R323324*(mlib_d64*)(dst + i ) = dd0;325*(mlib_d64*)(dst + i + 2) = dd1;326*(mlib_d64*)(dst + i + 4) = dd2;327*(mlib_d64*)(dst + i + 6) = dd3;328}329330for (; i < width; i++) {331((mlib_s32*)dst)[i] = READ_Bgr(i);332}333334PTR_ADD(dstBase, dstScan);335PTR_ADD(srcBase, srcScan);336}337}338339/***************************************************************/340341void ADD_SUFF(ThreeByteBgrToIntBgrScaleConvert)(SCALE_PARAMS)342{343mlib_s32 dstScan = pDstInfo->scanStride;344mlib_s32 srcScan = pSrcInfo->scanStride;345mlib_d64 dd, dzero;346mlib_s32 i, i0, i1, j;347348if (width < 16) {349for (j = 0; j < height; j++) {350mlib_u8 *src = srcBase;351mlib_s32 *dst = dstBase;352mlib_s32 *dst_end = dst + width;353mlib_s32 tmpsxloc = sxloc;354355PTR_ADD(src, (syloc >> shift) * srcScan);356357for (; dst < dst_end; dst++) {358i = tmpsxloc >> shift;359tmpsxloc += sxinc;360*(mlib_s32*)dst = READ_Bgr(i);361}362363PTR_ADD(dstBase, dstScan);364syloc += syinc;365}366return;367}368369dzero = vis_fzero();370371vis_alignaddr(NULL, 7);372373for (j = 0; j < height; j++) {374mlib_u8 *src = srcBase;375mlib_f32 *dst = dstBase;376mlib_f32 *dst_end = dst + width;377mlib_s32 tmpsxloc = sxloc;378379PTR_ADD(src, (syloc >> shift) * srcScan);380381if ((mlib_s32)dst & 7) {382i = tmpsxloc >> shift;383tmpsxloc += sxinc;384*(mlib_s32*)dst = READ_Bgr(i);385dst++;386}387388#pragma pipeloop(0)389for (; dst <= dst_end - 2; dst += 2) {390i0 = tmpsxloc >> shift;391i1 = (tmpsxloc + sxinc) >> shift;392tmpsxloc += 2*sxinc;393394dd = vis_faligndata(vis_ld_u8(src + 3*i1 + 2), dd);395dd = vis_faligndata(vis_ld_u8(src + 3*i1 + 1), dd);396dd = vis_faligndata(vis_ld_u8(src + 3*i1 ), dd);397dd = vis_faligndata(dzero, dd);398dd = vis_faligndata(vis_ld_u8(src + 3*i0 + 2), dd);399dd = vis_faligndata(vis_ld_u8(src + 3*i0 + 1), dd);400dd = vis_faligndata(vis_ld_u8(src + 3*i0 ), dd);401dd = vis_faligndata(dzero, dd);402403*(mlib_d64*)dst = dd;404}405406for (; dst < dst_end; dst++) {407i = tmpsxloc >> shift;408tmpsxloc += sxinc;409*(mlib_s32*)dst = READ_Bgr(i);410}411412PTR_ADD(dstBase, dstScan);413syloc += syinc;414}415}416417/***************************************************************/418419void ADD_SUFF(IntArgbBmToIntBgrXparOver)(BLIT_PARAMS)420{421mlib_s32 dstScan = pDstInfo->scanStride;422mlib_s32 srcScan = pSrcInfo->scanStride;423mlib_d64 dd;424mlib_s32 i, i0, j, mask, x;425426if (dstScan == 4*width && srcScan == 4*width) {427width *= height;428height = 1;429}430431for (j = 0; j < height; j++) {432mlib_s32 *src = srcBase;433mlib_s32 *dst = dstBase;434435i = i0 = 0;436437if ((mlib_s32)dst & 7) {438if (*(mlib_u8*)(src + i)) {439x = src[i];440dst[i] = ARGB_to_GBGR(x);441}442i0 = 1;443}444445#pragma pipeloop(0)446for (i = i0; i <= (mlib_s32)width - 2; i += 2) {447ARGB_to_GBGR_FL2(dd, ((mlib_f32*)src)[i], ((mlib_f32*)src)[i + 1]);448mask = (((-*(mlib_u8*)(src + i)) >> 31) & 2) |449(((-*(mlib_u8*)(src + i + 1)) >> 31) & 1);450vis_pst_32(dd, dst + i, mask);451}452453if (i < width) {454if (*(mlib_u8*)(src + i)) {455x = src[i];456dst[i] = ARGB_to_GBGR(x);457}458}459460PTR_ADD(dstBase, dstScan);461PTR_ADD(srcBase, srcScan);462}463}464465/***************************************************************/466467void ADD_SUFF(IntArgbBmToIntBgrScaleXparOver)(SCALE_PARAMS)468{469mlib_s32 dstScan = pDstInfo->scanStride;470mlib_s32 srcScan = pSrcInfo->scanStride;471mlib_d64 dd;472mlib_s32 j, mask;473474for (j = 0; j < height; j++) {475mlib_s32 *src = srcBase;476mlib_s32 *dst = dstBase;477mlib_s32 *dst_end = dst + width;478mlib_s32 tmpsxloc = sxloc;479480PTR_ADD(src, (syloc >> shift) * srcScan);481482if ((mlib_s32)dst & 7) {483mlib_s32 *pp = src + (tmpsxloc >> shift);484if (*(mlib_u8*)pp) {485*dst = ARGB_to_GBGR(*pp);486}487dst++;488tmpsxloc += sxinc;489}490491#pragma pipeloop(0)492for (; dst <= dst_end - 2; dst += 2) {493mlib_s32 *pp0 = src + (tmpsxloc >> shift);494mlib_s32 *pp1 = src + ((tmpsxloc + sxinc) >> shift);495ARGB_to_GBGR_FL2(dd, *(mlib_f32*)pp0, *(mlib_f32*)pp1);496mask = (((-*(mlib_u8*)pp0) >> 31) & 2) |497((mlib_u32)(-*(mlib_u8*)pp1) >> 31);498vis_pst_32(dd, dst, mask);499tmpsxloc += 2*sxinc;500}501502for (; dst < dst_end; dst++) {503mlib_s32 *pp = src + (tmpsxloc >> shift);504if (*(mlib_u8*)pp) {505*dst = ARGB_to_GBGR(*pp);506}507}508509PTR_ADD(dstBase, dstScan);510syloc += syinc;511}512}513514/***************************************************************/515516void ADD_SUFF(IntArgbBmToIntBgrXparBgCopy)(BCOPY_PARAMS)517{518mlib_s32 dstScan = pDstInfo->scanStride;519mlib_s32 srcScan = pSrcInfo->scanStride;520mlib_d64 dd, d_bgpixel;521mlib_s32 i, i0, j, mask;522523if (dstScan == 4*width && srcScan == 4*width) {524width *= height;525height = 1;526}527528vis_alignaddr(NULL, 1);529d_bgpixel = vis_to_double_dup(bgpixel);530531for (j = 0; j < height; j++) {532mlib_s32 *src = srcBase;533mlib_s32 *dst = dstBase;534535i = i0 = 0;536537if ((mlib_s32)dst & 7) {538if (*(mlib_u8*)(src + i)) {539dst[i] = ARGB_to_GBGR(src[i]);540} else {541dst[i] = bgpixel;542}543i0 = 1;544}545546#pragma pipeloop(0)547for (i = i0; i <= (mlib_s32)width - 2; i += 2) {548ARGB_to_GBGR_FL2(dd, ((mlib_f32*)src)[i], ((mlib_f32*)src)[i + 1]);549mask = (((-*(mlib_u8*)(src + i)) >> 31) & 2) |550(((-*(mlib_u8*)(src + i + 1)) >> 31) & 1);551*(mlib_d64*)(dst + i) = d_bgpixel;552vis_pst_32(dd, dst + i, mask);553}554555if (i < width) {556if (*(mlib_u8*)(src + i)) {557dst[i] = ARGB_to_GBGR(src[i]);558} else {559dst[i] = bgpixel;560}561}562563PTR_ADD(dstBase, dstScan);564PTR_ADD(srcBase, srcScan);565}566}567568/***************************************************************/569570void ADD_SUFF(ByteIndexedToIntBgrConvert)(BLIT_PARAMS)571{572jint *pixLut = pSrcInfo->lutBase;573mlib_s32 dstScan = pDstInfo->scanStride;574mlib_s32 srcScan = pSrcInfo->scanStride;575mlib_d64 dd;576mlib_s32 i, i0, j, x;577578if (srcScan == width && dstScan == 4*width) {579width *= height;580height = 1;581}582583for (j = 0; j < height; j++) {584mlib_u8 *src = srcBase;585mlib_s32 *dst = dstBase;586587i = i0 = 0;588589if ((mlib_s32)dst & 7) {590x = pixLut[src[i]];591dst[i] = ARGB_to_GBGR(x);592i0 = 1;593}594595#pragma pipeloop(0)596for (i = i0; i <= (mlib_s32)width - 2; i += 2) {597ARGB_to_GBGR_FL2(dd, ((mlib_f32*)pixLut)[src[i]],598((mlib_f32*)pixLut)[src[i + 1]]);599*(mlib_d64*)(dst + i) = dd;600}601602for (; i < width; i++) {603x = pixLut[src[i]];604dst[i] = ARGB_to_GBGR(x);605}606607PTR_ADD(dstBase, dstScan);608PTR_ADD(srcBase, srcScan);609}610}611612/***************************************************************/613614void ADD_SUFF(ByteIndexedToIntBgrScaleConvert)(SCALE_PARAMS)615{616jint *pixLut = pSrcInfo->lutBase;617mlib_s32 dstScan = pDstInfo->scanStride;618mlib_s32 srcScan = pSrcInfo->scanStride;619mlib_d64 dd;620mlib_s32 j, x;621622for (j = 0; j < height; j++) {623mlib_u8 *src = srcBase;624mlib_s32 *dst = dstBase;625mlib_s32 *dst_end = dst + width;626mlib_s32 tmpsxloc = sxloc;627628PTR_ADD(src, (syloc >> shift) * srcScan);629630if ((mlib_s32)dst & 7) {631x = pixLut[src[tmpsxloc >> shift]];632*dst++ = ARGB_to_GBGR(x);633tmpsxloc += sxinc;634}635636#pragma pipeloop(0)637for (; dst <= dst_end - 2; dst += 2) {638mlib_f32 f0 = ((mlib_f32*)pixLut)[src[tmpsxloc >> shift]];639mlib_f32 f1 = ((mlib_f32*)pixLut)[src[(tmpsxloc + sxinc) >> shift]];640ARGB_to_GBGR_FL2(dd, f0, f1);641*(mlib_d64*)dst = dd;642tmpsxloc += 2*sxinc;643}644645for (; dst < dst_end; dst++) {646x = pixLut[src[tmpsxloc >> shift]];647*dst++ = ARGB_to_GBGR(x);648tmpsxloc += sxinc;649}650651PTR_ADD(dstBase, dstScan);652syloc += syinc;653}654}655656/***************************************************************/657658void ADD_SUFF(ByteIndexedBmToIntBgrXparOver)(BLIT_PARAMS)659{660jint *pixLut = pSrcInfo->lutBase;661mlib_s32 dstScan = pDstInfo->scanStride;662mlib_s32 srcScan = pSrcInfo->scanStride;663mlib_d64 dd;664mlib_s32 i, i0, j, x, mask;665666if (srcScan == width && dstScan == 4*width) {667width *= height;668height = 1;669}670671for (j = 0; j < height; j++) {672mlib_u8 *src = srcBase;673mlib_s32 *dst = dstBase;674675i = i0 = 0;676677if ((mlib_s32)dst & 7) {678x = pixLut[src[i]];679if (x < 0) {680dst[i] = ARGB_to_BGR(x);681}682i0 = 1;683}684685#pragma pipeloop(0)686for (i = i0; i <= (mlib_s32)width - 2; i += 2) {687mlib_f32 *pp0 = (mlib_f32*)pixLut + src[i];688mlib_f32 *pp1 = (mlib_f32*)pixLut + src[i + 1];689ARGB_to_BGR_FL2(dd, *pp0, *pp1);690mask = (((*(mlib_u8*)pp0) >> 6) & 2) | ((*(mlib_u8*)pp1) >> 7);691vis_pst_32(dd, dst + i, mask);692}693694for (; i < width; i++) {695x = pixLut[src[i]];696if (x < 0) {697dst[i] = ARGB_to_BGR(x);698}699}700701PTR_ADD(dstBase, dstScan);702PTR_ADD(srcBase, srcScan);703}704}705706/***************************************************************/707708void ADD_SUFF(ByteIndexedBmToIntBgrScaleXparOver)(SCALE_PARAMS)709{710jint *pixLut = pSrcInfo->lutBase;711mlib_s32 dstScan = pDstInfo->scanStride;712mlib_s32 srcScan = pSrcInfo->scanStride;713mlib_d64 dd;714mlib_s32 j, x, mask;715716for (j = 0; j < height; j++) {717mlib_u8 *src = srcBase;718mlib_s32 *dst = dstBase;719mlib_s32 *dst_end = dst + width;720mlib_s32 tmpsxloc = sxloc;721722PTR_ADD(src, (syloc >> shift) * srcScan);723724if ((mlib_s32)dst & 7) {725x = pixLut[src[tmpsxloc >> shift]];726tmpsxloc += sxinc;727if (x < 0) {728*dst = ARGB_to_BGR(x);729}730dst++;731}732733#pragma pipeloop(0)734for (; dst <= dst_end - 2; dst += 2) {735mlib_f32 *p0 = (mlib_f32*)pixLut + src[tmpsxloc >> shift];736mlib_f32 *p1 = (mlib_f32*)pixLut + src[(tmpsxloc + sxinc) >> shift];737ARGB_to_BGR_FL2(dd, *p0, *p1);738mask = (((*(mlib_u8*)p0) >> 6) & 2) | ((*(mlib_u8*)p1) >> 7);739tmpsxloc += 2*sxinc;740vis_pst_32(dd, dst, mask);741}742743for (; dst < dst_end; dst++) {744x = pixLut[src[tmpsxloc >> shift]];745tmpsxloc += sxinc;746if (x < 0) {747*dst = ARGB_to_BGR(x);748}749}750751PTR_ADD(dstBase, dstScan);752syloc += syinc;753}754}755756/***************************************************************/757758void ADD_SUFF(ByteIndexedBmToIntBgrXparBgCopy)(BCOPY_PARAMS)759{760jint *pixLut = pSrcInfo->lutBase;761mlib_s32 dstScan = pDstInfo->scanStride;762mlib_s32 srcScan = pSrcInfo->scanStride;763mlib_d64 dd, d_bgpixel;764mlib_s32 j, x, mask;765766if (srcScan == width && dstScan == 4*width) {767width *= height;768height = 1;769}770771d_bgpixel = vis_to_double_dup(bgpixel);772773for (j = 0; j < height; j++) {774mlib_u8 *src = srcBase;775mlib_s32 *dst = dstBase;776mlib_s32 *dst_end;777778dst_end = dst + width;779780if ((mlib_s32)dst & 7) {781x = pixLut[*src++];782if (x < 0) {783*dst = ARGB_to_GBGR(x);784} else {785*dst = bgpixel;786}787dst++;788}789790#pragma pipeloop(0)791for (; dst <= (dst_end - 2); dst += 2) {792mlib_f32 *pp0 = (mlib_f32*)pixLut + src[0];793mlib_f32 *pp1 = (mlib_f32*)pixLut + src[1];794ARGB_to_GBGR_FL2(dd, *pp0, *pp1);795mask = (((*(mlib_u8*)pp0) >> 6) & 2) | ((*(mlib_u8*)pp1) >> 7);796*(mlib_d64*)dst = d_bgpixel;797vis_pst_32(dd, dst, mask);798src += 2;799}800801while (dst < dst_end) {802x = pixLut[*src++];803if (x < 0) {804*dst = ARGB_to_GBGR(x);805} else {806*dst = bgpixel;807}808dst++;809}810811PTR_ADD(dstBase, dstScan);812PTR_ADD(srcBase, srcScan);813}814}815816/***************************************************************/817818void ADD_SUFF(IntBgrDrawGlyphListAA)(GLYPH_LIST_PARAMS)819{820mlib_s32 glyphCounter;821mlib_s32 scan = pRasInfo->scanStride;822mlib_u8 *dstBase;823mlib_s32 j;824mlib_d64 dmix0, dmix1, dd, d0, d1, e0, e1, fgpixel_d;825mlib_d64 done, done16, d_half, maskRGB, dzero;826mlib_s32 pix, mask, mask_z;827mlib_f32 srcG_f;828829done = vis_to_double_dup(0x7fff7fff);830done16 = vis_to_double_dup(0x7fff);831d_half = vis_to_double_dup((1 << (16 + 6)) | (1 << 6));832833fgpixel_d = vis_to_double_dup(fgpixel);834srcG_f = vis_to_float(argbcolor);835maskRGB = vis_to_double_dup(0xffffff);836dzero = vis_fzero();837838ARGB2ABGR_FL(srcG_f)839840vis_write_gsr(0 << 3);841842for (glyphCounter = 0; glyphCounter < totalGlyphs; glyphCounter++) {843const jubyte *pixels;844unsigned int rowBytes;845int left, top;846int width, height;847int right, bottom;848849pixels = (const jubyte *) glyphs[glyphCounter].pixels;850851if (!pixels) continue;852853left = glyphs[glyphCounter].x;854top = glyphs[glyphCounter].y;855width = glyphs[glyphCounter].width;856height = glyphs[glyphCounter].height;857rowBytes = width;858right = left + width;859bottom = top + height;860if (left < clipLeft) {861pixels += clipLeft - left;862left = clipLeft;863}864if (top < clipTop) {865pixels += (clipTop - top) * rowBytes;866top = clipTop;867}868if (right > clipRight) {869right = clipRight;870}871if (bottom > clipBottom) {872bottom = clipBottom;873}874if (right <= left || bottom <= top) {875continue;876}877width = right - left;878height = bottom - top;879880dstBase = pRasInfo->rasBase;881PTR_ADD(dstBase, top*scan + 4*left);882883for (j = 0; j < height; j++) {884mlib_u8 *src = (void*)pixels;885mlib_s32 *dst, *dst_end;886887dst = (void*)dstBase;888dst_end = dst + width;889890if ((mlib_s32)dst & 7) {891pix = *src++;892if (pix) {893dd = vis_fpadd16(MUL8_VIS(srcG_f, pix), d_half);894dd = vis_fpadd16(MUL8_VIS(*(mlib_f32*)dst, 255 - pix), dd);895*(mlib_f32*)dst = vis_fands(vis_fpack16(dd),896vis_read_hi(maskRGB));897if (pix == 255) *(mlib_f32*)dst = vis_read_hi(fgpixel_d);898}899dst++;900}901902#pragma pipeloop(0)903for (; dst <= (dst_end - 2); dst += 2) {904dmix0 = vis_freg_pair(((mlib_f32 *)vis_mul8s_tbl)[src[0]],905((mlib_f32 *)vis_mul8s_tbl)[src[1]]);906mask = vis_fcmplt32(dmix0, done16);907mask_z = vis_fcmpne32(dmix0, dzero);908dmix1 = vis_fpsub16(done, dmix0);909src += 2;910911dd = *(mlib_d64*)dst;912d0 = vis_fmul8x16al(srcG_f, vis_read_hi(dmix0));913d1 = vis_fmul8x16al(srcG_f, vis_read_lo(dmix0));914e0 = vis_fmul8x16al(vis_read_hi(dd), vis_read_hi(dmix1));915e1 = vis_fmul8x16al(vis_read_lo(dd), vis_read_lo(dmix1));916d0 = vis_fpadd16(vis_fpadd16(d0, d_half), e0);917d1 = vis_fpadd16(vis_fpadd16(d1, d_half), e1);918dd = vis_fpack16_pair(d0, d1);919dd = vis_fand(dd, maskRGB);920921vis_pst_32(fgpixel_d, dst, mask_z);922vis_pst_32(dd, dst, mask & mask_z);923}924925while (dst < dst_end) {926pix = *src++;927if (pix) {928dd = vis_fpadd16(MUL8_VIS(srcG_f, pix), d_half);929dd = vis_fpadd16(MUL8_VIS(*(mlib_f32*)dst, 255 - pix), dd);930*(mlib_f32*)dst = vis_fands(vis_fpack16(dd),931vis_read_hi(maskRGB));932if (pix == 255) *(mlib_f32*)dst = vis_read_hi(fgpixel_d);933}934dst++;935}936937PTR_ADD(dstBase, scan);938pixels += rowBytes;939}940}941}942943/***************************************************************/944945#endif /* JAVA2D_NO_MLIB */946947948