934 lines
23 KiB
C
934 lines
23 KiB
C
|
/*
|
||
|
* cfb copy area
|
||
|
*/
|
||
|
|
||
|
/*
|
||
|
|
||
|
Copyright 1989, 1998 The Open Group
|
||
|
|
||
|
Permission to use, copy, modify, distribute, and sell this software and its
|
||
|
documentation for any purpose is hereby granted without fee, provided that
|
||
|
the above copyright notice appear in all copies and that both that
|
||
|
copyright notice and this permission notice appear in supporting
|
||
|
documentation.
|
||
|
|
||
|
The above copyright notice and this permission notice shall be included in
|
||
|
all copies or substantial portions of the Software.
|
||
|
|
||
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||
|
OPEN GROUP BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
|
||
|
AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
|
||
|
CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
||
|
|
||
|
Except as contained in this notice, the name of The Open Group shall not be
|
||
|
used in advertising or otherwise to promote the sale, use or other dealings
|
||
|
in this Software without prior written authorization from The Open Group.
|
||
|
|
||
|
Author: Keith Packard
|
||
|
|
||
|
*/
|
||
|
|
||
|
/* 24-bit bug fixes: Peter Wainwright, 1998/11/28 */
|
||
|
|
||
|
#ifdef HAVE_DIX_CONFIG_H
|
||
|
#include <dix-config.h>
|
||
|
#endif
|
||
|
|
||
|
#include <stdlib.h>
#include <string.h>
|
||
|
|
||
|
#include <X11/X.h>
|
||
|
#include <X11/Xmd.h>
|
||
|
#include <X11/Xproto.h>
|
||
|
#include "gcstruct.h"
|
||
|
#include "windowstr.h"
|
||
|
#include "scrnintstr.h"
|
||
|
#include "pixmapstr.h"
|
||
|
#include "regionstr.h"
|
||
|
#include "cfb.h"
|
||
|
#include "cfbmskbits.h"
|
||
|
#include "cfb8bit.h"
|
||
|
#include "fastblt.h"
|
||
|
#include "mergerop.h"
|
||
|
|
||
|
/*
 * Optional fast paths used by cfbDoBitblt below.
 *
 * DO_UNALIGNED_BITBLT: when defined, cfbDoBitblt offsets the source line
 * pointer by the byte difference between the source and destination
 * alignments and compiles out its shift-and-merge branch.  The definition
 * is wrapped in "#ifdef notdef", so it only takes effect if notdef is
 * defined.
 */
#ifdef notdef /* XXX fails right now, walks off end of pixmaps */
|
||
|
#if defined (FAST_UNALIGNED_READS) && PSZ == 8
|
||
|
#define DO_UNALIGNED_BITBLT
|
||
|
#endif
|
||
|
#endif
|
||
|
|
||
|
/*
 * DO_MEMCPY: when defined, cfbDoBitblt copies each scanline of a rectangle
 * with one C-library block copy in the forward case.  It is only enabled
 * for 8-bit pixels with the plain copy rasterop (MROP == Mcopy).
 */
#if defined(FAST_MEMCPY) && (MROP == Mcopy) && PSZ == 8
|
||
|
#define DO_MEMCPY
|
||
|
#endif
|
||
|
|
||
|
/* ................................................. */
|
||
|
/* SPECIAL CODE FOR 24 BITS by Peter Wainwright */
|
||
|
|
||
|
#if PSZ == 24 && (MROP) == 0
|
||
|
|
||
|
/* The default macros are defined in mergerop.h, and none of them are
|
||
|
really appropriate for what we want to do.
|
||
|
|
||
|
There are two ways of fixing this: either define SLOW_24BIT_COPY
|
||
|
to copy pixel by pixel, or (by default) use the following macros
|
||
|
modified from mergerop.h
|
||
|
|
||
|
MROP_SOLID and MROP_MASK are defined for each of the operations,
|
||
|
i.e. each value of MROP.
|
||
|
|
||
|
There are special cases for Mcopy, McopyInverted, Mxor, and Mor.
|
||
|
There is a completely generic version for MROP=0, and a simplified
|
||
|
generic version which works for (Mcopy|Mxor|MandReverse|Mor).
|
||
|
|
||
|
However, the generic version does not work for the 24-bit case
|
||
|
because the pixels cannot be packed exactly into a machine word (32
|
||
|
bits).
|
||
|
|
||
|
Alternative macros MROP_SOLID24 and MROP_MASK24 are provided for
|
||
|
the 24-bit case. However, these each copy a single *pixel*, not a
|
||
|
single machine word. They take an rvalue source pixel, an lvalue
|
||
|
destination, and the pixel index. The latter is used to find the
|
||
|
position of the pixel data within the two words *dst and *(dst+1).
|
||
|
|
||
|
Further macros MROP_SOLID24P and MROP_MASK24P are used to copy from
|
||
|
an lvalue source to an lvalue destination. MROP_PIXEL24 is used to
|
||
|
assemble the source pixel from the adjacent words *src and
|
||
|
*(src+1), and this is then split between the destination words
|
||
|
using the non-P macros above.
|
||
|
|
||
|
But we want to copy entire words for the sake of efficiency.
|
||
|
Unfortunately if a plane mask is specified this must be shifted
|
||
|
from one word to the next. Fortunately the pattern repeats after 3
|
||
|
words, so we unroll the planemask here and redefine MROP_SOLID
|
||
|
and MROP_MASK. */
|
||
|
|
||
|
|
||
|
#endif /* MROP == 0 && PSZ == 24 */
|
||
|
|
||
|
/* ................................................. */
|
||
|
|
||
|
/*
 * Constants for packed 24-bit pixels.  Pixels do not divide evenly into
 * machine words; the packing pattern repeats every 3 words.
 */
#if PSZ == 24
|
||
|
#define BYPP 3 /* bytes per pixel; multiplied by a pixel x to get a byte offset */
|
||
|
#if PGSZ == 32
|
||
|
#define P3W 4 /* pixels in 3 machine words */
|
||
|
#define PAM 3 /* pixel align mask; PAM = P3W -1 */
|
||
|
#define P2WSH 2 /* right shift turning a byte offset into a CfbBits word offset */
|
||
|
#else
|
||
|
#define P3W 8 /* pixels in 3 machine words */
|
||
|
#define PAM 7 /* pixel align mask; PAM = P3W -1 */
|
||
|
#define P2WSH 3 /* right shift turning a byte offset into a CfbBits word offset */
|
||
|
#endif
|
||
|
#endif
|
||
|
|
||
|
void
|
||
|
MROP_NAME(cfbDoBitblt)(
|
||
|
DrawablePtr pSrc,
|
||
|
DrawablePtr pDst,
|
||
|
int alu,
|
||
|
RegionPtr prgnDst,
|
||
|
DDXPointPtr pptSrc,
|
||
|
unsigned long planemask)
|
||
|
{
|
||
|
CfbBits *psrcBase, *pdstBase;
|
||
|
/* start of src and dst bitmaps */
|
||
|
int widthSrc, widthDst; /* add to get to same position in next line */
|
||
|
|
||
|
BoxPtr pbox;
|
||
|
int nbox;
|
||
|
|
||
|
BoxPtr pboxTmp, pboxNext, pboxBase, pboxNew1, pboxNew2;
|
||
|
/* temporaries for shuffling rectangles */
|
||
|
DDXPointPtr pptTmp, pptNew1, pptNew2;
|
||
|
/* shuffling boxes entails shuffling the
|
||
|
source points too */
|
||
|
int w, h;
|
||
|
int xdir; /* 1 = left right, -1 = right left/ */
|
||
|
int ydir; /* 1 = top down, -1 = bottom up */
|
||
|
|
||
|
CfbBits *psrcLine, *pdstLine;
|
||
|
/* pointers to line with current src and dst */
|
||
|
register CfbBits *psrc;/* pointer to current src longword */
|
||
|
register CfbBits *pdst;/* pointer to current dst longword */
|
||
|
|
||
|
MROP_DECLARE_REG()
|
||
|
|
||
|
/* following used for looping through a line */
|
||
|
CfbBits startmask, endmask; /* masks for writing ends of dst */
|
||
|
int nlMiddle; /* whole longwords in dst */
|
||
|
int xoffSrc, xoffDst;
|
||
|
register int nl; /* temp copy of nlMiddle */
|
||
|
int careful;
|
||
|
|
||
|
#if (PSZ != 24) || (MROP != 0)
|
||
|
register int leftShift, rightShift;
|
||
|
register CfbBits bits;
|
||
|
register CfbBits bits1;
|
||
|
#endif
|
||
|
|
||
|
#if PSZ == 24
|
||
|
#ifdef DO_MEMCPY
|
||
|
int w2;
|
||
|
#endif
|
||
|
|
||
|
#if MROP == 0
|
||
|
int widthSrcBytes = cfbGetByteWidth(pSrc);
|
||
|
int widthDstBytes = cfbGetByteWidth(pDst);
|
||
|
#endif
|
||
|
#endif
|
||
|
|
||
|
MROP_INITIALIZE(alu,planemask)
|
||
|
|
||
|
cfbGetLongWidthAndPointer (pSrc, widthSrc, psrcBase)
|
||
|
|
||
|
cfbGetLongWidthAndPointer (pDst, widthDst, pdstBase)
|
||
|
|
||
|
/* XXX we have to err on the side of safety when both are windows,
|
||
|
* because we don't know if IncludeInferiors is being used.
|
||
|
*/
|
||
|
careful = ((pSrc == pDst) ||
|
||
|
((pSrc->type == DRAWABLE_WINDOW) &&
|
||
|
(pDst->type == DRAWABLE_WINDOW)));
|
||
|
|
||
|
pbox = REGION_RECTS(prgnDst);
|
||
|
nbox = REGION_NUM_RECTS(prgnDst);
|
||
|
|
||
|
pboxNew1 = NULL;
|
||
|
pptNew1 = NULL;
|
||
|
pboxNew2 = NULL;
|
||
|
pptNew2 = NULL;
|
||
|
if (careful && (pptSrc->y < pbox->y1))
|
||
|
{
|
||
|
/* walk source botttom to top */
|
||
|
ydir = -1;
|
||
|
widthSrc = -widthSrc;
|
||
|
widthDst = -widthDst;
|
||
|
|
||
|
if (nbox > 1)
|
||
|
{
|
||
|
/* keep ordering in each band, reverse order of bands */
|
||
|
pboxNew1 = (BoxPtr)ALLOCATE_LOCAL(sizeof(BoxRec) * nbox);
|
||
|
if(!pboxNew1)
|
||
|
return;
|
||
|
pptNew1 = (DDXPointPtr)ALLOCATE_LOCAL(sizeof(DDXPointRec) * nbox);
|
||
|
if(!pptNew1)
|
||
|
{
|
||
|
DEALLOCATE_LOCAL(pboxNew1);
|
||
|
return;
|
||
|
}
|
||
|
pboxBase = pboxNext = pbox+nbox-1;
|
||
|
while (pboxBase >= pbox)
|
||
|
{
|
||
|
while ((pboxNext >= pbox) &&
|
||
|
(pboxBase->y1 == pboxNext->y1))
|
||
|
pboxNext--;
|
||
|
pboxTmp = pboxNext+1;
|
||
|
pptTmp = pptSrc + (pboxTmp - pbox);
|
||
|
while (pboxTmp <= pboxBase)
|
||
|
{
|
||
|
*pboxNew1++ = *pboxTmp++;
|
||
|
*pptNew1++ = *pptTmp++;
|
||
|
}
|
||
|
pboxBase = pboxNext;
|
||
|
}
|
||
|
pboxNew1 -= nbox;
|
||
|
pbox = pboxNew1;
|
||
|
pptNew1 -= nbox;
|
||
|
pptSrc = pptNew1;
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
/* walk source top to bottom */
|
||
|
ydir = 1;
|
||
|
}
|
||
|
|
||
|
if (careful && (pptSrc->x < pbox->x1))
|
||
|
{
|
||
|
/* walk source right to left */
|
||
|
xdir = -1;
|
||
|
|
||
|
if (nbox > 1)
|
||
|
{
|
||
|
/* reverse order of rects in each band */
|
||
|
pboxNew2 = (BoxPtr)ALLOCATE_LOCAL(sizeof(BoxRec) * nbox);
|
||
|
pptNew2 = (DDXPointPtr)ALLOCATE_LOCAL(sizeof(DDXPointRec) * nbox);
|
||
|
if(!pboxNew2 || !pptNew2)
|
||
|
{
|
||
|
if (pptNew2) DEALLOCATE_LOCAL(pptNew2);
|
||
|
if (pboxNew2) DEALLOCATE_LOCAL(pboxNew2);
|
||
|
if (pboxNew1)
|
||
|
{
|
||
|
DEALLOCATE_LOCAL(pptNew1);
|
||
|
DEALLOCATE_LOCAL(pboxNew1);
|
||
|
}
|
||
|
return;
|
||
|
}
|
||
|
pboxBase = pboxNext = pbox;
|
||
|
while (pboxBase < pbox+nbox)
|
||
|
{
|
||
|
while ((pboxNext < pbox+nbox) &&
|
||
|
(pboxNext->y1 == pboxBase->y1))
|
||
|
pboxNext++;
|
||
|
pboxTmp = pboxNext;
|
||
|
pptTmp = pptSrc + (pboxTmp - pbox);
|
||
|
while (pboxTmp != pboxBase)
|
||
|
{
|
||
|
*pboxNew2++ = *--pboxTmp;
|
||
|
*pptNew2++ = *--pptTmp;
|
||
|
}
|
||
|
pboxBase = pboxNext;
|
||
|
}
|
||
|
pboxNew2 -= nbox;
|
||
|
pbox = pboxNew2;
|
||
|
pptNew2 -= nbox;
|
||
|
pptSrc = pptNew2;
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
/* walk source left to right */
|
||
|
xdir = 1;
|
||
|
}
|
||
|
|
||
|
while(nbox--)
|
||
|
{
|
||
|
w = pbox->x2 - pbox->x1;
|
||
|
h = pbox->y2 - pbox->y1;
|
||
|
|
||
|
#if PSZ == 24
|
||
|
#ifdef DO_MEMCPY
|
||
|
w2 = w * BYPP;
|
||
|
#endif
|
||
|
#endif
|
||
|
if (ydir == -1) /* start at last scanline of rectangle */
|
||
|
{
|
||
|
psrcLine = psrcBase + ((pptSrc->y+h-1) * -widthSrc);
|
||
|
pdstLine = pdstBase + ((pbox->y2-1) * -widthDst);
|
||
|
}
|
||
|
else /* start at first scanline */
|
||
|
{
|
||
|
psrcLine = psrcBase + (pptSrc->y * widthSrc);
|
||
|
pdstLine = pdstBase + (pbox->y1 * widthDst);
|
||
|
}
|
||
|
#if PSZ == 24
|
||
|
if (w == 1 && ((pbox->x1 & PAM) == 0 || (pbox->x1 & PAM) == PAM))
|
||
|
#else
|
||
|
if ((pbox->x1 & PIM) + w <= PPW)
|
||
|
#endif
|
||
|
{
|
||
|
maskpartialbits (pbox->x1, w, endmask);
|
||
|
startmask = 0;
|
||
|
nlMiddle = 0;
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
maskbits(pbox->x1, w, startmask, endmask, nlMiddle);
|
||
|
}
|
||
|
|
||
|
#if PSZ == 24
|
||
|
#if 0
|
||
|
nlMiddle = w - (pbox->x2 &PAM);;
|
||
|
if(pbox->x1 & PAM){
|
||
|
nlMiddle -= (PAM+1 - (pbox->x1 &PAM));
|
||
|
}
|
||
|
nlMiddle >>= P2WSH;
|
||
|
if(nlMiddle < 0)
|
||
|
nlMiddle = 0;
|
||
|
#endif
|
||
|
#endif
|
||
|
|
||
|
#ifdef DO_MEMCPY
|
||
|
/* If the src and dst scanline don't overlap, do forward case. */
|
||
|
|
||
|
if ((xdir == 1) || (pptSrc->y != pbox->y1)
|
||
|
|| (pptSrc->x + w <= pbox->x1))
|
||
|
{
|
||
|
#if PSZ == 24
|
||
|
char *psrc = (char *) psrcLine + (pptSrc->x * BYPP);
|
||
|
char *pdst = (char *) pdstLine + (pbox->x1 * BYPP);
|
||
|
#else
|
||
|
char *psrc = (char *) psrcLine + pptSrc->x;
|
||
|
char *pdst = (char *) pdstLine + pbox->x1;
|
||
|
#endif
|
||
|
while (h--)
|
||
|
{
|
||
|
#if PSZ == 24
|
||
|
memcpy(pdst, psrc, w2);
|
||
|
#else
|
||
|
memcpy(pdst, psrc, w);
|
||
|
#endif
|
||
|
pdst += widthDst << PWSH;
|
||
|
psrc += widthSrc << PWSH;
|
||
|
}
|
||
|
}
|
||
|
#else /* ! DO_MEMCPY */
|
||
|
if (xdir == 1)
|
||
|
{
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
/* Note: x is a pixel number; the byte offset is 3*x;
|
||
|
therefore the offset within a word is (3*x) & 3 ==
|
||
|
(4*x-x) & 3 == (-x) & 3. The offsets therefore
|
||
|
DECREASE by 1 for each pixel.
|
||
|
*/
|
||
|
xoffSrc = ( - pptSrc->x) & PAM;
|
||
|
xoffDst = ( - pbox->x1) & PAM;
|
||
|
#if 1
|
||
|
if((int)xoffSrc != (int)xoffDst /* Alignments must be same. */
|
||
|
|| ((widthDstBytes & PAM) != (widthSrcBytes & PAM) && h > 1))
|
||
|
#else
|
||
|
if(1)
|
||
|
#endif
|
||
|
/* Width also must be same, if hight > 1 */
|
||
|
{
|
||
|
/* ...otherwise, pixel by pixel operation */
|
||
|
while (h--)
|
||
|
{
|
||
|
register int i, si, sii, di;
|
||
|
|
||
|
for (i = 0, si = pptSrc->x, di = pbox->x1;
|
||
|
i < w;
|
||
|
i++, si++, di++) {
|
||
|
psrc = psrcLine + ((si * BYPP) >> P2WSH);
|
||
|
pdst = pdstLine + ((di * BYPP) >> P2WSH);
|
||
|
sii = (si & 3);
|
||
|
MROP_SOLID24P(psrc, pdst, sii, di);
|
||
|
}
|
||
|
pdstLine += widthDst;
|
||
|
psrcLine += widthSrc;
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
#endif
|
||
|
{
|
||
|
|
||
|
#if PSZ == 24
|
||
|
|
||
|
#if MROP != 0
|
||
|
xoffSrc = ( - pptSrc->x) & PAM;
|
||
|
xoffDst = ( - pbox->x1) & PAM;
|
||
|
#endif
|
||
|
pdstLine += (pbox->x1 * BYPP) >> P2WSH;
|
||
|
psrcLine += (pptSrc->x * BYPP) >> P2WSH;
|
||
|
#else
|
||
|
xoffSrc = pptSrc->x & PIM;
|
||
|
xoffDst = pbox->x1 & PIM;
|
||
|
pdstLine += (pbox->x1 >> PWSH);
|
||
|
psrcLine += (pptSrc->x >> PWSH);
|
||
|
#endif
|
||
|
#ifdef DO_UNALIGNED_BITBLT
|
||
|
nl = xoffSrc - xoffDst;
|
||
|
psrcLine = (CfbBits *)
|
||
|
(((unsigned char *) psrcLine) + nl);
|
||
|
#else
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
/* alredy satisfied */
|
||
|
#else
|
||
|
if (xoffSrc == xoffDst)
|
||
|
#endif
|
||
|
#endif
|
||
|
{
|
||
|
while (h--)
|
||
|
{
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
register int index;
|
||
|
register int im3;
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
psrc = psrcLine;
|
||
|
pdst = pdstLine;
|
||
|
pdstLine += widthDst;
|
||
|
psrcLine += widthSrc;
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
index = (int)(pdst - pdstBase);
|
||
|
im3 = index % 3;
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
if (startmask)
|
||
|
{
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
*pdst = DoMaskMergeRop24u(*psrc, *pdst, startmask, im3);
|
||
|
index++;
|
||
|
im3 = index % 3;
|
||
|
#else /* PSZ != 24 || MROP != 0 */
|
||
|
*pdst = MROP_MASK(*psrc, *pdst, startmask);
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
psrc++;
|
||
|
pdst++;
|
||
|
}
|
||
|
|
||
|
nl = nlMiddle;
|
||
|
#ifdef LARGE_INSTRUCTION_CACHE
|
||
|
#ifdef FAST_CONSTANT_OFFSET_MODE
|
||
|
|
||
|
psrc += nl & (UNROLL-1);
|
||
|
pdst += nl & (UNROLL-1);
|
||
|
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
#define BodyOdd(n) pdst[-n] = DoMergeRop24u(psrc[-n], pdst[-n], ((int)(pdst - n - pdstBase))%3);
|
||
|
#define BodyEven(n) pdst[-n] = DoMergeRop24u(psrc[-n], pdst[-n], ((int)(pdst - n - pdstBase))%3);
|
||
|
#else /* PSZ != 24 || MROP != 0 */
|
||
|
#define BodyOdd(n) pdst[-n] = MROP_SOLID (psrc[-n], pdst[-n]);
|
||
|
#define BodyEven(n) pdst[-n] = MROP_SOLID (psrc[-n], pdst[-n]);
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
|
||
|
#define LoopReset \
|
||
|
pdst += UNROLL; \
|
||
|
psrc += UNROLL;
|
||
|
|
||
|
#else
|
||
|
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
#define BodyOdd(n) *pdst = DoMergeRop24u(*psrc, *pdst, im3); pdst++; psrc++; index++; im3 = index % 3;
|
||
|
#define BodyEven(n) BodyOdd(n)
|
||
|
#else /* PSZ != 24 || MROP != 0 */
|
||
|
#define BodyOdd(n) *pdst = MROP_SOLID (*psrc, *pdst); pdst++; psrc++;
|
||
|
#define BodyEven(n) BodyOdd(n)
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
|
||
|
#define LoopReset ;
|
||
|
|
||
|
#endif
|
||
|
PackedLoop
|
||
|
|
||
|
#undef BodyOdd
|
||
|
#undef BodyEven
|
||
|
#undef LoopReset
|
||
|
|
||
|
#else
|
||
|
#ifdef NOTDEF
|
||
|
/* you'd think this would be faster --
|
||
|
* a single instruction instead of 6
|
||
|
* but measurements show it to be ~15% slower
|
||
|
*/
|
||
|
while ((nl -= 6) >= 0)
|
||
|
{
|
||
|
asm ("moveml %1+,#0x0c0f;moveml#0x0c0f,%0"
|
||
|
: "=m" (*(char *)pdst)
|
||
|
: "m" (*(char *)psrc)
|
||
|
: "d0", "d1", "d2", "d3",
|
||
|
"a2", "a3");
|
||
|
pdst += 6;
|
||
|
}
|
||
|
nl += 6;
|
||
|
while (nl--)
|
||
|
*pdst++ = *psrc++;
|
||
|
#endif
|
||
|
#if 0 /*PSZ == 24 && MROP == 0*/
|
||
|
DuffL(nl, label1,
|
||
|
*pdst = DoMergeRop24u(*psrc, *pdst, im3);
|
||
|
pdst++; psrc++; index++;im3 = index % 3;)
|
||
|
#else /* !(PSZ == 24 && MROP == 0) */
|
||
|
DuffL(nl, label1,
|
||
|
*pdst = MROP_SOLID (*psrc, *pdst);
|
||
|
pdst++; psrc++;)
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
#endif
|
||
|
|
||
|
if (endmask)
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
*pdst = DoMaskMergeRop24u(*psrc, *pdst, endmask, (int)(pdst - pdstBase) % 3);
|
||
|
#else /* !(PSZ == 24 && MROP == 0) */
|
||
|
*pdst = MROP_MASK(*psrc, *pdst, endmask);
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
}
|
||
|
}
|
||
|
#ifndef DO_UNALIGNED_BITBLT
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
/* can not happen */
|
||
|
#else /* !(PSZ == 24 && MROP == 0) */
|
||
|
else /* xoffSrc != xoffDst */
|
||
|
{
|
||
|
if (xoffSrc > xoffDst)
|
||
|
{
|
||
|
#if PSZ == 24
|
||
|
leftShift = (xoffSrc - xoffDst) << 3;
|
||
|
#else
|
||
|
#if PGSZ == 32
|
||
|
leftShift = (xoffSrc - xoffDst) << (5 - PWSH);
|
||
|
#else /* PGSZ == 64 */
|
||
|
leftShift = (xoffSrc - xoffDst) << (6 - PWSH);
|
||
|
#endif /* PGSZ */
|
||
|
#endif
|
||
|
rightShift = PGSZ - leftShift;
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
#if PSZ == 24
|
||
|
rightShift = (xoffDst - xoffSrc) << 3;
|
||
|
#else
|
||
|
#if PGSZ == 32
|
||
|
rightShift = (xoffDst - xoffSrc) << (5 - PWSH);
|
||
|
#else /* PGSZ == 64 */
|
||
|
rightShift = (xoffDst - xoffSrc) << (6 - PWSH);
|
||
|
#endif /* PGSZ */
|
||
|
#endif
|
||
|
leftShift = PGSZ - rightShift;
|
||
|
}
|
||
|
while (h--)
|
||
|
{
|
||
|
psrc = psrcLine;
|
||
|
pdst = pdstLine;
|
||
|
pdstLine += widthDst;
|
||
|
psrcLine += widthSrc;
|
||
|
bits = 0;
|
||
|
if (xoffSrc > xoffDst)
|
||
|
bits = *psrc++;
|
||
|
if (startmask)
|
||
|
{
|
||
|
bits1 = BitLeft(bits,leftShift);
|
||
|
bits = *psrc++;
|
||
|
bits1 |= BitRight(bits,rightShift);
|
||
|
*pdst = MROP_MASK(bits1, *pdst, startmask);
|
||
|
pdst++;
|
||
|
}
|
||
|
nl = nlMiddle;
|
||
|
#ifdef LARGE_INSTRUCTION_CACHE
|
||
|
bits1 = bits;
|
||
|
|
||
|
#ifdef FAST_CONSTANT_OFFSET_MODE
|
||
|
|
||
|
psrc += nl & (UNROLL-1);
|
||
|
pdst += nl & (UNROLL-1);
|
||
|
|
||
|
#define BodyOdd(n) \
|
||
|
bits = psrc[-n]; \
|
||
|
pdst[-n] = MROP_SOLID(BitLeft(bits1, leftShift) | BitRight(bits, rightShift), pdst[-n]);
|
||
|
|
||
|
#define BodyEven(n) \
|
||
|
bits1 = psrc[-n]; \
|
||
|
pdst[-n] = MROP_SOLID(BitLeft(bits, leftShift) | BitRight(bits1, rightShift), pdst[-n]);
|
||
|
|
||
|
#define LoopReset \
|
||
|
pdst += UNROLL; \
|
||
|
psrc += UNROLL;
|
||
|
|
||
|
#else
|
||
|
|
||
|
#define BodyOdd(n) \
|
||
|
bits = *psrc++; \
|
||
|
*pdst = MROP_SOLID(BitLeft(bits1, leftShift) | BitRight(bits, rightShift), *pdst); \
|
||
|
pdst++;
|
||
|
|
||
|
#define BodyEven(n) \
|
||
|
bits1 = *psrc++; \
|
||
|
*pdst = MROP_SOLID(BitLeft(bits, leftShift) | BitRight(bits1, rightShift), *pdst); \
|
||
|
pdst++;
|
||
|
|
||
|
#define LoopReset ;
|
||
|
|
||
|
#endif /* !FAST_CONSTANT_OFFSET_MODE */
|
||
|
|
||
|
PackedLoop
|
||
|
|
||
|
#undef BodyOdd
|
||
|
#undef BodyEven
|
||
|
#undef LoopReset
|
||
|
|
||
|
#else
|
||
|
DuffL (nl,label2,
|
||
|
bits1 = BitLeft(bits, leftShift);
|
||
|
bits = *psrc++;
|
||
|
*pdst = MROP_SOLID (bits1 | BitRight(bits, rightShift), *pdst);
|
||
|
pdst++;
|
||
|
)
|
||
|
#endif
|
||
|
|
||
|
if (endmask)
|
||
|
{
|
||
|
bits1 = BitLeft(bits, leftShift);
|
||
|
if (BitLeft(endmask, rightShift))
|
||
|
{
|
||
|
bits = *psrc;
|
||
|
bits1 |= BitRight(bits, rightShift);
|
||
|
}
|
||
|
*pdst = MROP_MASK (bits1, *pdst, endmask);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
#endif /* (PSZ == 24 && MROP == 0) */
|
||
|
#endif /* DO_UNALIGNED_BITBLT */
|
||
|
|
||
|
}
|
||
|
}
|
||
|
#endif /* ! DO_MEMCPY */
|
||
|
else /* xdir == -1 */
|
||
|
{
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
xoffSrc = (-(pptSrc->x + w)) & PAM;
|
||
|
xoffDst = (-pbox->x2) & PAM;
|
||
|
#if 1
|
||
|
if(xoffSrc != xoffDst /* Alignments must be same. */
|
||
|
|| ((widthDstBytes & PAM) != (widthSrcBytes & PAM) && h > 1))
|
||
|
#else
|
||
|
if(1)
|
||
|
#endif
|
||
|
/* Width also must be same, if hight > 1 */
|
||
|
{
|
||
|
/* ...otherwise, pixel by pixel operation */
|
||
|
while (h--)
|
||
|
{
|
||
|
register int i, si, sii, di;
|
||
|
|
||
|
for (i = 0, si = pptSrc->x + w - 1, di = pbox->x2 - 1;
|
||
|
i < w;
|
||
|
i++, si--, di--) {
|
||
|
psrc = psrcLine + ((si * BYPP) >> P2WSH);
|
||
|
pdst = pdstLine + ((di * BYPP) >> P2WSH);
|
||
|
sii = (si & PAM);
|
||
|
MROP_SOLID24P(psrc, pdst, sii, di);
|
||
|
}
|
||
|
psrcLine += widthSrc;
|
||
|
pdstLine += widthDst;
|
||
|
}
|
||
|
}else
|
||
|
#endif /* MROP == 0 && PSZ == 24 */
|
||
|
{
|
||
|
|
||
|
#if PSZ == 24
|
||
|
#if MROP == 0
|
||
|
/* already calculated */
|
||
|
#else
|
||
|
xoffSrc = (pptSrc->x + w) & PAM;
|
||
|
xoffDst = pbox->x2 & PAM;
|
||
|
#endif
|
||
|
pdstLine += ((pbox->x2 * BYPP - 1) >> P2WSH) + 1;
|
||
|
psrcLine += (((pptSrc->x+w) * BYPP - 1) >> P2WSH) + 1;
|
||
|
#else
|
||
|
xoffSrc = (pptSrc->x + w - 1) & PIM;
|
||
|
xoffDst = (pbox->x2 - 1) & PIM;
|
||
|
pdstLine += ((pbox->x2-1) >> PWSH) + 1;
|
||
|
psrcLine += ((pptSrc->x+w - 1) >> PWSH) + 1;
|
||
|
#endif
|
||
|
#ifdef DO_UNALIGNED_BITBLT
|
||
|
#if PSZ == 24
|
||
|
nl = xoffDst - xoffSrc;
|
||
|
#else
|
||
|
nl = xoffSrc - xoffDst;
|
||
|
#endif
|
||
|
psrcLine = (CfbBits *)
|
||
|
(((unsigned char *) psrcLine) + nl);
|
||
|
#else
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
/* already satisfied */
|
||
|
#else
|
||
|
if (xoffSrc == xoffDst)
|
||
|
#endif
|
||
|
#endif
|
||
|
{
|
||
|
while (h--)
|
||
|
{
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
register int index;
|
||
|
register int im3;
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
psrc = psrcLine;
|
||
|
pdst = pdstLine;
|
||
|
pdstLine += widthDst;
|
||
|
psrcLine += widthSrc;
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
index = (int)(pdst - pdstBase);
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
|
||
|
if (endmask)
|
||
|
{
|
||
|
pdst--;
|
||
|
psrc--;
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
index--;
|
||
|
im3 = index % 3;
|
||
|
*pdst = DoMaskMergeRop24u(*psrc, *pdst, endmask, im3);
|
||
|
#else /* !(PSZ == 24 && MROP == 0) */
|
||
|
*pdst = MROP_MASK (*psrc, *pdst, endmask);
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
}
|
||
|
nl = nlMiddle;
|
||
|
#ifdef LARGE_INSTRUCTION_CACHE
|
||
|
#ifdef FAST_CONSTANT_OFFSET_MODE
|
||
|
psrc -= nl & (UNROLL - 1);
|
||
|
pdst -= nl & (UNROLL - 1);
|
||
|
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
#define BodyOdd(n) pdst[n-1] = DoMergeRop24u(psrc[n-1], pdst[n-1], ((int)(pdst - (n - 1) -pdstBase)) % 3);
|
||
|
#else /* !(PSZ == 24 && MROP == 0) */
|
||
|
#define BodyOdd(n) pdst[n-1] = MROP_SOLID (psrc[n-1], pdst[n-1]);
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
|
||
|
#define BodyEven(n) BodyOdd(n)
|
||
|
|
||
|
#define LoopReset \
|
||
|
pdst -= UNROLL;\
|
||
|
psrc -= UNROLL;
|
||
|
|
||
|
#else
|
||
|
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
#define BodyOdd(n) --pdst; --psrc; --index; im3 = index % 3;*pdst = DoMergeRop24u(*psrc, *pdst, im3);
|
||
|
#else /* !(PSZ == 24 && MROP == 0) */
|
||
|
#define BodyOdd(n) --pdst; --psrc; *pdst = MROP_SOLID(*psrc, *pdst);
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
#define BodyEven(n) BodyOdd(n)
|
||
|
#define LoopReset ;
|
||
|
|
||
|
#endif
|
||
|
PackedLoop
|
||
|
|
||
|
#undef BodyOdd
|
||
|
#undef BodyEven
|
||
|
#undef LoopReset
|
||
|
|
||
|
#else
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
DuffL(nl,label3,
|
||
|
--pdst; --psrc; --index; im3= index%3;*pdst = DoMergeRop24u(*psrc, *pdst, im3);)
|
||
|
#else /* !(PSZ == 24 && MROP == 0) */
|
||
|
DuffL(nl,label3,
|
||
|
--pdst; --psrc; *pdst = MROP_SOLID (*psrc, *pdst);)
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
#endif
|
||
|
|
||
|
if (startmask)
|
||
|
{
|
||
|
--pdst;
|
||
|
--psrc;
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
*pdst = DoMaskMergeRop24u(*psrc, *pdst, startmask, (int)(pdst - pdstBase) % 3);
|
||
|
#else /* !(PSZ == 24 && MROP == 0) */
|
||
|
*pdst = MROP_MASK(*psrc, *pdst, startmask);
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
#ifndef DO_UNALIGNED_BITBLT
|
||
|
#if PSZ == 24 && MROP == 0
|
||
|
/* can not happen */
|
||
|
#else /* !( PSZ == 24 && MROP == 0) */
|
||
|
else
|
||
|
{
|
||
|
if (xoffDst > xoffSrc)
|
||
|
{
|
||
|
#if PSZ == 24
|
||
|
leftShift = (xoffDst - xoffSrc) << 3;
|
||
|
rightShift = PGSZ - leftShift;
|
||
|
#else
|
||
|
#if PGSZ == 32
|
||
|
rightShift = (xoffDst - xoffSrc) << (5 - PWSH);
|
||
|
#else /* PGSZ == 64 */
|
||
|
rightShift = (xoffDst - xoffSrc) << (6 - PWSH);
|
||
|
#endif /* PGSZ */
|
||
|
leftShift = PGSZ - rightShift;
|
||
|
#endif
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
#if PSZ == 24
|
||
|
rightShift = (xoffSrc - xoffDst) << 3;
|
||
|
leftShift = PGSZ - rightShift;
|
||
|
#else
|
||
|
#if PGSZ == 32
|
||
|
leftShift = (xoffSrc - xoffDst) << (5 - PWSH);
|
||
|
#else /* PGSZ == 64 */
|
||
|
leftShift = (xoffSrc - xoffDst) << (6 - PWSH);
|
||
|
#endif /* PGSZ */
|
||
|
rightShift = PGSZ - leftShift;
|
||
|
#endif
|
||
|
}
|
||
|
while (h--)
|
||
|
{
|
||
|
psrc = psrcLine;
|
||
|
pdst = pdstLine;
|
||
|
pdstLine += widthDst;
|
||
|
psrcLine += widthSrc;
|
||
|
bits = 0;
|
||
|
#if PSZ == 24
|
||
|
if (xoffSrc > xoffDst)
|
||
|
#else
|
||
|
if (xoffDst > xoffSrc)
|
||
|
#endif
|
||
|
bits = *--psrc;
|
||
|
if (endmask)
|
||
|
{
|
||
|
bits1 = BitRight(bits, rightShift);
|
||
|
bits = *--psrc;
|
||
|
bits1 |= BitLeft(bits, leftShift);
|
||
|
pdst--;
|
||
|
*pdst = MROP_MASK(bits1, *pdst, endmask);
|
||
|
}
|
||
|
nl = nlMiddle;
|
||
|
#ifdef LARGE_INSTRUCTION_CACHE
|
||
|
bits1 = bits;
|
||
|
#ifdef FAST_CONSTANT_OFFSET_MODE
|
||
|
psrc -= nl & (UNROLL - 1);
|
||
|
pdst -= nl & (UNROLL - 1);
|
||
|
|
||
|
#define BodyOdd(n) \
|
||
|
bits = psrc[n-1]; \
|
||
|
pdst[n-1] = MROP_SOLID(BitRight(bits1, rightShift) | BitLeft(bits, leftShift),pdst[n-1]);
|
||
|
|
||
|
#define BodyEven(n) \
|
||
|
bits1 = psrc[n-1]; \
|
||
|
pdst[n-1] = MROP_SOLID(BitRight(bits, rightShift) | BitLeft(bits1, leftShift),pdst[n-1]);
|
||
|
|
||
|
#define LoopReset \
|
||
|
pdst -= UNROLL; \
|
||
|
psrc -= UNROLL;
|
||
|
|
||
|
#else
|
||
|
|
||
|
#define BodyOdd(n) \
|
||
|
bits = *--psrc; --pdst; \
|
||
|
*pdst = MROP_SOLID(BitRight(bits1, rightShift) | BitLeft(bits, leftShift),*pdst);
|
||
|
|
||
|
#define BodyEven(n) \
|
||
|
bits1 = *--psrc; --pdst; \
|
||
|
*pdst = MROP_SOLID(BitRight(bits, rightShift) | BitLeft(bits1, leftShift),*pdst);
|
||
|
|
||
|
#define LoopReset ;
|
||
|
|
||
|
#endif
|
||
|
|
||
|
PackedLoop
|
||
|
|
||
|
#undef BodyOdd
|
||
|
#undef BodyEven
|
||
|
#undef LoopReset
|
||
|
|
||
|
#else
|
||
|
DuffL (nl, label4,
|
||
|
bits1 = BitRight(bits, rightShift);
|
||
|
bits = *--psrc;
|
||
|
--pdst;
|
||
|
*pdst = MROP_SOLID(bits1 | BitLeft(bits, leftShift),*pdst);
|
||
|
)
|
||
|
#endif
|
||
|
|
||
|
if (startmask)
|
||
|
{
|
||
|
bits1 = BitRight(bits, rightShift);
|
||
|
if (BitRight (startmask, leftShift))
|
||
|
{
|
||
|
bits = *--psrc;
|
||
|
bits1 |= BitLeft(bits, leftShift);
|
||
|
}
|
||
|
--pdst;
|
||
|
*pdst = MROP_MASK(bits1, *pdst, startmask);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
#endif /* PSZ == 24 && MROP == 0 */
|
||
|
#endif
|
||
|
}
|
||
|
}
|
||
|
pbox++;
|
||
|
pptSrc++;
|
||
|
}
|
||
|
if (pboxNew2)
|
||
|
{
|
||
|
DEALLOCATE_LOCAL(pptNew2);
|
||
|
DEALLOCATE_LOCAL(pboxNew2);
|
||
|
}
|
||
|
if (pboxNew1)
|
||
|
{
|
||
|
DEALLOCATE_LOCAL(pptNew1);
|
||
|
DEALLOCATE_LOCAL(pboxNew1);
|
||
|
}
|
||
|
}
|