/* * Fill odd tiled rectangles and spans. * no depth dependencies. */ /* Copyright 1989 by the Massachusetts Institute of Technology Permission to use, copy, modify, and distribute this software and its documentation for any purpose and without fee is hereby granted, provided that the above copyright notice appear in all copies and that both that copyright notice and this permission notice appear in supporting documentation, and that the name of M.I.T. not be used in advertising or publicity pertaining to distribution of the software without specific, written prior permission. M.I.T. makes no representations about the suitability of this software for any purpose. It is provided "as is" without express or implied warranty. */ /* $XConsortium: cfbtileodd.c,v 1.13 91/07/10 17:26:10 keith Exp $ */ #include "X.h" #include "Xmd.h" #include "servermd.h" #include "gcstruct.h" #include "window.h" #include "pixmapstr.h" #include "scrnintstr.h" #include "windowstr.h" #include "cfb.h" #include "cfbmskbits.h" #include "cfb8bit.h" #include "mergerop.h" #define LastTileBits {\ tmp = bits; \ if (tileEndPart) \ bits = (*pSrc & tileEndMask) | BitRight (*pSrcLine, tileEndLeftShift); \ else \ bits = *pSrc; \ } #define ResetTileBits {\ pSrc = pSrcLine; \ nlwSrc = widthSrc;\ if (tileEndPart) { \ if (PPW - xoff + tileEndPart <= PPW) {\ bits = *pSrc++; \ nlwSrc--; \ } else \ bits = BitLeft(tmp, tileEndLeftShift) | \ BitRight(bits, tileEndRightShift); \ xoff = (xoff + xoffStep) & PIM; \ leftShift = xoff << (5-PWSH); \ rightShift = 32 - leftShift; \ }\ } #define NextTileBits {\ if (nlwSrc == 1) {\ LastTileBits\ } else { \ if (nlwSrc == 0) {\ ResetTileBits\ } \ if (nlwSrc == 1) {\ LastTileBits\ } else {\ tmp = bits; \ bits = *pSrc++; \ }\ }\ nlwSrc--; \ } void MROP_NAME(cfbFillBoxTileOdd) (pDrawable, nBox, pBox, tile, xrot, yrot, alu, planemask) DrawablePtr pDrawable; int nBox; /* number of boxes to fill */ register BoxPtr pBox; /* pointer to list of boxes to fill */ PixmapPtr tile; /* tile */ int xrot, yrot; int alu; unsigned long planemask; { hpPrivPixmapPtr tilePriv; int tileWidth; /* width of tile in pixels */ int tileHeight; /* height of the tile */ int widthSrc; int strideSrc; int widthDst; /* width in longwords of the dest pixmap */ int w; /* width of current box */ int h; /* height of current box */ unsigned long startmask; unsigned long endmask; /* masks for reggedy bits at either end of line */ int nlwMiddle; /* number of longwords between sides of boxes */ int nlwSrc; /* number of whole longwords in source */ register int nlw; /* loop version of nlwMiddle */ int srcy; /* current tile y position */ int srcx; /* current tile x position */ int xoffDst, xoffSrc; int leftShift, rightShift; MROP_DECLARE_REG() unsigned long *pDstBase; /* pointer to start of dest */ unsigned long *pDstLine; /* poitner to start of dest box */ unsigned long *pSrcBase; /* pointer to start of source */ unsigned long *pSrcLine; /* pointer to start of source line */ register unsigned long *pDst; register unsigned long *pSrc; register unsigned long bits, tmp; register int nlwPart; int xoffStart, xoff; int leftShiftStart, rightShiftStart, nlwSrcStart; unsigned long tileEndMask; int tileEndLeftShift, tileEndRightShift; int xoffStep; int tileEndPart; int needFirst; unsigned long narrow[2]; unsigned long narrowMask; int narrowShift; Bool narrowTile; MROP_INITIALIZE (alu, planemask) tileHeight = tile->drawable.height; tileWidth = tile->drawable.width; tilePriv = (hpPrivPixmapPtr)tile->devPrivate.ptr; if (tile->devKind == PIXMAP_FRAME_BUFFER) widthSrc = tilePriv->pChunk->w >> 2; else widthSrc = tilePriv->stride >> 2; strideSrc = tilePriv->stride >> 2; narrowTile = FALSE; if (widthSrc == 1) { narrowShift = tileWidth; narrowMask = cfbendpartial [tileWidth]; tileWidth *= 2; widthSrc = 2; narrowTile = TRUE; } pSrcBase = (unsigned long *)tilePriv->bits; cfbGetLongWidthAndPointer (pDrawable, widthDst, pDstBase) SET_REGISTERS_FOR_WRITING(pDrawable->pScreen, ~0, GXcopy); if (tile->devKind == PIXMAP_FRAME_BUFFER) WAIT_READY_TO_RENDER(tile->drawable.pScreen); tileEndPart = tileWidth & PIM; tileEndMask = cfbendpartial[tileEndPart]; tileEndLeftShift = (tileEndPart) << (5-PWSH); tileEndRightShift = 32 - tileEndLeftShift; xoffStep = PPW - tileEndPart; /* * current assumptions: tile > 32 bits wide. */ while (nBox--) { w = pBox->x2 - pBox->x1; h = pBox->y2 - pBox->y1; modulus (pBox->x1 - xrot, tileWidth, srcx); modulus (pBox->y1 - yrot, tileHeight, srcy); xoffDst = pBox->x1 & PIM; if (xoffDst + w < PPW) { maskpartialbits(pBox->x1, w, startmask); endmask = 0; nlwMiddle = 0; } else { maskbits (pBox->x1, w, startmask, endmask, nlwMiddle) } pDstLine = pDstBase + (pBox->y1 * widthDst) + (pBox->x1 >> PWSH); pSrcLine = pSrcBase + (srcy * strideSrc); xoffSrc = srcx & PIM; if (xoffSrc >= xoffDst) { xoffStart = xoffSrc - xoffDst; needFirst = 1; } else { xoffStart = PPW - (xoffDst - xoffSrc); needFirst = 0; } leftShiftStart = (xoffStart) << (5-PWSH); rightShiftStart = 32 - leftShiftStart; nlwSrcStart = widthSrc - (srcx >> PWSH); while (h--) { /* XXX only works when narrowShift >= PPW/2 */ if (narrowTile) { tmp = pSrcBase[srcy] & narrowMask; /* source width == 1 */ narrow[0] = tmp | SCRRIGHT (tmp, narrowShift); narrow[1] = SCRLEFT (tmp, PPW - narrowShift) | SCRRIGHT(tmp, 2 * narrowShift - PPW); pSrcLine = narrow; } xoff = xoffStart; leftShift = leftShiftStart; rightShift = rightShiftStart; nlwSrc = nlwSrcStart; pSrc = pSrcLine + (srcx >> PWSH); pDst = pDstLine; bits = 0; if (needFirst) { NextTileBits } if (startmask) { NextTileBits tmp = BitLeft(tmp, leftShift); if (rightShift != 32) tmp |= BitRight(bits,rightShift); *pDst = MROP_MASK (tmp, *pDst, startmask); ++pDst; } nlw = nlwMiddle; while (nlw) { #if MROP == Mcopy if (nlwSrc > 1) { nlwPart = nlw; if (nlwPart >= nlwSrc) nlwPart = nlwSrc - 1; nlw -= nlwPart; nlwSrc -= nlwPart; if (rightShift != 32) { while (nlwPart--) { tmp = bits; bits = *pSrc++; *pDst = MROP_SOLID(BitLeft(tmp, leftShift) | BitRight (bits, rightShift), *pDst); ++pDst; } } else { if (nlwPart) { *pDst = MROP_SOLID (bits, *pDst); ++pDst; nlwPart--; while (nlwPart--) { *pDst = MROP_SOLID(*pSrc, *pDst); ++pDst; ++pSrc; } bits = *pSrc++; } } } else #endif { NextTileBits if (rightShift != 32) { *pDst = MROP_SOLID(BitLeft(tmp, leftShift) | BitRight(bits, rightShift), *pDst); } else { *pDst = MROP_SOLID (tmp, *pDst); } ++pDst; nlw--; } } if (endmask) { NextTileBits if (rightShift == 32) bits = 0; *pDst = MROP_MASK (BitLeft(tmp, leftShift) | BitRight(bits,rightShift), *pDst, endmask); } pDstLine += widthDst; pSrcLine += strideSrc; if (++srcy == tileHeight) { srcy = 0; pSrcLine = pSrcBase; } } pBox++; } } void MROP_NAME(cfbFillSpanTileOdd) (pDrawable, n, ppt, pwidth, tile, xrot, yrot, alu, planemask) DrawablePtr pDrawable; int n; DDXPointPtr ppt; int *pwidth; PixmapPtr tile; int xrot, yrot; int alu; unsigned long planemask; { hpPrivPixmapPtr tilePriv; int tileWidth; /* width of tile in pixels */ int tileHeight; /* height of the tile */ int widthSrc; int strideSrc; int widthDst; /* width in longwords of the dest pixmap */ int w; /* width of current span */ unsigned long startmask; unsigned long endmask; /* masks for reggedy bits at either end of line */ int nlwSrc; /* number of whole longwords in source */ register int nlw; /* loop version of nlwMiddle */ int srcy; /* current tile y position */ int srcx; /* current tile x position */ int xoffDst, xoffSrc; int leftShift, rightShift; MROP_DECLARE_REG() unsigned long *pDstBase; /* pointer to start of dest */ unsigned long *pDstLine; /* poitner to start of dest box */ unsigned long *pSrcBase; /* pointer to start of source */ unsigned long *pSrcLine; /* pointer to start of source line */ register unsigned long *pDst; register unsigned long *pSrc; register unsigned long bits, tmp; register int nlwPart; int xoffStart, xoff; int leftShiftStart, rightShiftStart, nlwSrcStart; unsigned long tileEndMask; int tileEndLeftShift, tileEndRightShift; int xoffStep; int tileEndPart; int needFirst; unsigned long narrow[2]; unsigned long narrowMask; int narrowShift; Bool narrowTile; MROP_INITIALIZE (alu, planemask) tileHeight = tile->drawable.height; tileWidth = tile->drawable.width; tilePriv = (hpPrivPixmapPtr)tile->devPrivate.ptr; if (tile->devKind == PIXMAP_FRAME_BUFFER) widthSrc = tilePriv->pChunk->w >> 2; else widthSrc = tilePriv->stride >> 2; strideSrc = tilePriv->stride >> 2; narrowTile = FALSE; if (widthSrc == 1) { narrowShift = tileWidth; narrowMask = cfbendpartial [tileWidth]; tileWidth *= 2; widthSrc = 2; narrowTile = TRUE; } pSrcBase = (unsigned long *)tilePriv->bits; cfbGetLongWidthAndPointer (pDrawable, widthDst, pDstBase) SET_REGISTERS_FOR_WRITING(pDrawable->pScreen, ~0, GXcopy); if (tile->devKind == PIXMAP_FRAME_BUFFER) WAIT_READY_TO_RENDER(tile->drawable.pScreen); tileEndPart = tileWidth & PIM; tileEndMask = cfbendpartial[tileEndPart]; tileEndLeftShift = (tileEndPart) << (5-PWSH); tileEndRightShift = 32 - tileEndLeftShift; xoffStep = PPW - tileEndPart; while (n--) { w = *pwidth++; modulus (ppt->x - xrot, tileWidth, srcx); modulus (ppt->y - yrot, tileHeight, srcy); xoffDst = ppt->x & PIM; if (xoffDst + w < PPW) { maskpartialbits(ppt->x, w, startmask); endmask = 0; nlw = 0; } else { maskbits (ppt->x, w, startmask, endmask, nlw) } pDstLine = pDstBase + (ppt->y * widthDst) + (ppt->x >> PWSH); pSrcLine = pSrcBase + (srcy * strideSrc); xoffSrc = srcx & PIM; if (xoffSrc >= xoffDst) { xoffStart = xoffSrc - xoffDst; needFirst = 1; } else { xoffStart = PPW - (xoffDst - xoffSrc); needFirst = 0; } leftShiftStart = (xoffStart) << (5-PWSH); rightShiftStart = 32 - leftShiftStart; nlwSrcStart = widthSrc - (srcx >> PWSH); /* XXX only works when narrowShift >= PPW/2 */ if (narrowTile) { tmp = pSrcBase[srcy] & narrowMask; /* source width == 1 */ narrow[0] = tmp | SCRRIGHT (tmp, narrowShift); narrow[1] = SCRLEFT (tmp, PPW - narrowShift) | SCRRIGHT(tmp, 2 * narrowShift - PPW); pSrcLine = narrow; } xoff = xoffStart; leftShift = leftShiftStart; rightShift = rightShiftStart; nlwSrc = nlwSrcStart; pSrc = pSrcLine + (srcx >> PWSH); pDst = pDstLine; bits = 0; if (needFirst) { NextTileBits } if (startmask) { NextTileBits tmp = BitLeft(tmp, leftShift); if (rightShift != 32) tmp |= BitRight(bits,rightShift); *pDst = MROP_MASK (tmp, *pDst, startmask); ++pDst; } while (nlw) { #if MROP == Mcopy if (nlwSrc > 1) { nlwPart = nlw; if (nlwPart >= nlwSrc) nlwPart = nlwSrc - 1; nlw -= nlwPart; nlwSrc -= nlwPart; if (rightShift != 32) { while (nlwPart--) { tmp = bits; bits = *pSrc++; *pDst = MROP_SOLID(BitLeft(tmp, leftShift) | BitRight (bits, rightShift), *pDst); ++pDst; } } else { if (nlwPart) { *pDst = MROP_SOLID (bits, *pDst); ++pDst; nlwPart--; while (nlwPart--) { *pDst = MROP_SOLID(*pSrc, *pDst); ++pDst; ++pSrc; } bits = *pSrc++; } } } else #endif { NextTileBits if (rightShift != 32) { *pDst = MROP_SOLID(BitLeft(tmp, leftShift) | BitRight(bits, rightShift), *pDst); ++pDst; } else { *pDst = MROP_SOLID (tmp, *pDst); ++pDst; } nlw--; } } if (endmask) { NextTileBits if (rightShift == 32) bits = 0; *pDst = MROP_MASK (BitLeft(tmp, leftShift) | BitRight(bits,rightShift), *pDst, endmask); } ppt++; } } # include "fastblt.h" #define IncSrcPtr psrc++; if (!--srcRemaining) { srcRemaining = widthSrc; psrc = psrcStart; } MROP_NAME(cfbFillBoxTile32s) (pDrawable, nBox, pBox, tile, xrot, yrot, alu, planemask) DrawablePtr pDrawable; int nBox; /* number of boxes to fill */ register BoxPtr pBox; /* pointer to list of boxes to fill */ PixmapPtr tile; /* tile */ int xrot, yrot; int alu; unsigned long planemask; { hpPrivPixmapPtr tilePriv; int tileWidth; /* width of tile */ int tileHeight; /* height of the tile */ int widthSrc; /* width in longwords of the source tile */ int strideSrc; int widthDst; /* width in longwords of the dest pixmap */ int w; /* width of current box */ int h; /* height of current box */ unsigned long startmask; unsigned long endmask; /* masks for reggedy bits at either end of line */ int nlMiddle; /* number of longwords between sides of boxes */ register int nl; /* loop version of nlMiddle */ int srcy; /* current tile y position */ int srcx; /* current tile x position */ int srcRemaining; /* number of longwords remaining in source */ int xoffDst, xoffSrc; int srcStart; /* number of longwords source offset at left of box */ int leftShift, rightShift; MROP_DECLARE_REG() unsigned long *pdstBase; /* pointer to start of dest */ unsigned long *pdstLine; /* poitner to start of dest box */ unsigned long *psrcBase; /* pointer to start of source */ unsigned long *psrcLine; /* pointer to fetch point of source */ unsigned long *psrcStart; /* pointer to start of source line */ register unsigned long *pdst; register unsigned long *psrc; register unsigned long bits, bits1; register int nlTemp; MROP_INITIALIZE (alu, planemask) tilePriv = (hpPrivPixmapPtr)tile->devPrivate.ptr; psrcBase = (unsigned long *)tilePriv->bits; tileHeight = tile->drawable.height; tileWidth = tile->drawable.width; widthSrc = tileWidth >> PWSH; strideSrc = tilePriv->stride >> PWSH; cfbGetLongWidthAndPointer (pDrawable, widthDst, pdstBase) SET_REGISTERS_FOR_WRITING(pDrawable->pScreen, ~0, GXcopy); if (tile->devKind == PIXMAP_FRAME_BUFFER) WAIT_READY_TO_RENDER(tile->drawable.pScreen); while (nBox--) { w = pBox->x2 - pBox->x1; h = pBox->y2 - pBox->y1; /* set up source */ modulus (pBox->x1 - xrot, tileWidth, srcx); modulus (pBox->y1 - yrot, tileHeight, srcy); xoffSrc = srcx & PIM; srcStart = (srcx >> PWSH); psrcStart = psrcBase + (srcy * strideSrc); psrcLine = psrcStart + srcStart; /* set up dest */ xoffDst = pBox->x1 & PIM; pdstLine = pdstBase + (pBox->y1 * widthDst) + (pBox->x1 >> PWSH); /* set up masks */ if (xoffDst + w < PPW) { maskpartialbits(pBox->x1, w, startmask); endmask = 0; nlMiddle = 0; } else { maskbits (pBox->x1, w, startmask, endmask, nlMiddle) } if (xoffSrc == xoffDst) { while (h--) { psrc = psrcLine; pdst = pdstLine; srcRemaining = widthSrc - srcStart; if (startmask) { *pdst = MROP_MASK (*psrc, *pdst, startmask); pdst++; IncSrcPtr } nlTemp = nlMiddle; while (nlTemp) { nl = nlTemp; if (nl > srcRemaining) nl = srcRemaining; nlTemp -= nl; srcRemaining -= nl; #if MROP == Mcopy #ifdef LARGE_INSTRUCTION_CACHE #ifdef FAST_CONSTANT_OFFSET_MODE psrc += nl & (UNROLL-1); pdst += nl & (UNROLL-1); #define BodyOdd(n) pdst[-n] = MROP_SOLID (psrc[-n], pdst[-n]); #define BodyEven(n) pdst[-n] = MROP_SOLID (psrc[-n], pdst[-n]); #define LoopReset \ pdst += UNROLL; \ psrc += UNROLL; #else #define BodyOdd(n) *pdst = MROP_SOLID (*psrc, *pdst); pdst++; psrc++; #define BodyEven(n) BodyOdd(n) #define LoopReset ; #endif PackedLoop #undef BodyOdd #undef BodyEven #undef LoopReset #else DuffL(nl, label1, *pdst = MROP_SOLID (*psrc, *pdst); pdst++; psrc++;) #endif #else while (nl--) { *pdst = MROP_SOLID (*psrc, *pdst); pdst++; psrc++; } #endif if (!srcRemaining) { srcRemaining = widthSrc; psrc = psrcStart; } } if (endmask) { *pdst = MROP_MASK (*psrc, *pdst, endmask); } pdstLine += widthDst; psrcLine += strideSrc; psrcStart += strideSrc; if (++srcy == tileHeight) { psrcStart = psrcBase; psrcLine = psrcStart + srcStart; srcy = 0; } } } else { if (xoffSrc > xoffDst) { leftShift = (xoffSrc - xoffDst) << (5 - PWSH); rightShift = 32 - leftShift; } else { rightShift = (xoffDst - xoffSrc) << (5 - PWSH); leftShift = 32 - rightShift; } while (h--) { psrc = psrcLine; pdst = pdstLine; bits = 0; srcRemaining = widthSrc - srcStart; if (xoffSrc > xoffDst) { bits = *psrc; IncSrcPtr } if (startmask) { bits1 = BitLeft(bits,leftShift); bits = *psrc; IncSrcPtr bits1 |= BitRight(bits,rightShift); *pdst = MROP_MASK(bits1, *pdst, startmask); pdst++; } nlTemp = nlMiddle; while (nlTemp) { nl = nlTemp; if (nl > srcRemaining) nl = srcRemaining; nlTemp -= nl; srcRemaining -= nl; #if MROP == Mcopy #ifdef LARGE_INSTRUCTION_CACHE bits1 = bits; #ifdef FAST_CONSTANT_OFFSET_MODE psrc += nl & (UNROLL-1); pdst += nl & (UNROLL-1); #define BodyOdd(n) \ bits = psrc[-n]; \ pdst[-n] = MROP_SOLID(BitLeft(bits1, leftShift) | BitRight(bits, rightShift), pdst[-n]); #define BodyEven(n) \ bits1 = psrc[-n]; \ pdst[-n] = MROP_SOLID(BitLeft(bits, leftShift) | BitRight(bits1, rightShift), pdst[-n]); #define LoopReset \ pdst += UNROLL; \ psrc += UNROLL; #else #define BodyOdd(n) \ bits = *psrc++; \ *pdst = MROP_SOLID(BitLeft(bits1, leftShift) | BitRight(bits, rightShift), *pdst); \ pdst++; #define BodyEven(n) \ bits1 = *psrc++; \ *pdst = MROP_SOLID(BitLeft(bits, leftShift) | BitRight(bits1, rightShift), *pdst); \ pdst++; #define LoopReset ; #endif /* !FAST_CONSTANT_OFFSET_MODE */ PackedLoop #undef BodyOdd #undef BodyEven #undef LoopReset #else DuffL (nl,label2, bits1 = BitLeft(bits, leftShift); bits = *psrc++; *pdst = MROP_SOLID (bits1 | BitRight(bits, rightShift), *pdst); pdst++; ) #endif #else while (nl--) { bits1 = BitLeft(bits, leftShift); bits = *psrc++; *pdst = MROP_SOLID (bits1 | BitRight(bits, rightShift), *pdst); pdst++; } #endif if (!srcRemaining) { srcRemaining = widthSrc; psrc = psrcStart; } } if (endmask) { bits1 = BitLeft(bits, leftShift); if (BitLeft(endmask, rightShift)) { bits = *psrc; bits1 |= BitRight(bits, rightShift); } *pdst = MROP_MASK (bits1, *pdst, endmask); } pdstLine += widthDst; psrcLine += strideSrc; psrcStart += strideSrc; if (++srcy == tileHeight) { psrcStart = psrcBase; psrcLine = psrcStart + srcStart; srcy = 0; } } } pBox++; } } MROP_NAME(cfbFillSpanTile32s) (pDrawable, n, ppt, pwidth, tile, xrot, yrot, alu, planemask) DrawablePtr pDrawable; int n; DDXPointPtr ppt; int *pwidth; PixmapPtr tile; int xrot, yrot; int alu; unsigned long planemask; { hpPrivPixmapPtr tilePriv; int tileWidth; /* width of tile */ int tileHeight; /* height of the tile */ int widthSrc; /* width in longwords of the source tile */ int strideSrc; int widthDst; /* width in longwords of the dest pixmap */ int w; /* width of current box */ unsigned long startmask; unsigned long endmask; /* masks for reggedy bits at either end of line */ int nlMiddle; /* number of longwords between sides of boxes */ register int nl; /* loop version of nlMiddle */ int srcy; /* current tile y position */ int srcx; /* current tile x position */ int srcRemaining; /* number of longwords remaining in source */ int xoffDst, xoffSrc; int srcStart; /* number of longwords source offset at left of box */ int leftShift, rightShift; MROP_DECLARE_REG() unsigned long *pdstBase; /* pointer to start of dest */ unsigned long *pdstLine; /* poitner to start of dest box */ unsigned long *psrcBase; /* pointer to start of source */ unsigned long *psrcLine; /* pointer to fetch point of source */ unsigned long *psrcStart; /* pointer to start of source line */ register unsigned long *pdst; register unsigned long *psrc; register unsigned long bits, bits1; register int nlTemp; MROP_INITIALIZE (alu, planemask) tilePriv = (hpPrivPixmapPtr)tile->devPrivate.ptr; psrcBase = (unsigned long *)tilePriv->bits; tileHeight = tile->drawable.height; tileWidth = tile->drawable.width; widthSrc = tileWidth >> PWSH; strideSrc = tilePriv->stride >> PWSH; cfbGetLongWidthAndPointer (pDrawable, widthDst, pdstBase) SET_REGISTERS_FOR_WRITING(pDrawable->pScreen, ~0, GXcopy); if (tile->devKind == PIXMAP_FRAME_BUFFER) WAIT_READY_TO_RENDER(tile->drawable.pScreen); while (n--) { w = *pwidth++; /* set up source */ modulus (ppt->x - xrot, tileWidth, srcx); modulus (ppt->y - yrot, tileHeight, srcy); xoffSrc = srcx & PIM; srcStart = (srcx >> PWSH); psrcStart = psrcBase + (srcy * strideSrc); psrcLine = psrcStart + srcStart; /* set up dest */ xoffDst = ppt->x & PIM; pdstLine = pdstBase + (ppt->y * widthDst) + (ppt->x >> PWSH); /* set up masks */ if (xoffDst + w < PPW) { maskpartialbits(ppt->x, w, startmask); endmask = 0; nlMiddle = 0; } else { maskbits (ppt->x, w, startmask, endmask, nlMiddle) } if (xoffSrc == xoffDst) { psrc = psrcLine; pdst = pdstLine; srcRemaining = widthSrc - srcStart; if (startmask) { *pdst = MROP_MASK (*psrc, *pdst, startmask); pdst++; IncSrcPtr } nlTemp = nlMiddle; while (nlTemp) { nl = nlTemp; if (nl > srcRemaining) nl = srcRemaining; nlTemp -= nl; srcRemaining -= nl; #if MROP == Mcopy #ifdef LARGE_INSTRUCTION_CACHE #ifdef FAST_CONSTANT_OFFSET_MODE psrc += nl & (UNROLL-1); pdst += nl & (UNROLL-1); #define BodyOdd(n) pdst[-n] = MROP_SOLID (psrc[-n], pdst[-n]); #define BodyEven(n) pdst[-n] = MROP_SOLID (psrc[-n], pdst[-n]); #define LoopReset \ pdst += UNROLL; \ psrc += UNROLL; #else #define BodyOdd(n) *pdst = MROP_SOLID (*psrc, *pdst); pdst++; psrc++; #define BodyEven(n) BodyOdd(n) #define LoopReset ; #endif PackedLoop #undef BodyOdd #undef BodyEven #undef LoopReset #else DuffL(nl, label1, *pdst = MROP_SOLID (*psrc, *pdst); pdst++; psrc++;) #endif #else while (nl--) { *pdst = MROP_SOLID (*psrc, *pdst); pdst++; psrc++; } #endif if (!srcRemaining) { srcRemaining = widthSrc; psrc = psrcStart; } } if (endmask) { *pdst = MROP_MASK (*psrc, *pdst, endmask); } } else { if (xoffSrc > xoffDst) { leftShift = (xoffSrc - xoffDst) << (5 - PWSH); rightShift = 32 - leftShift; } else { rightShift = (xoffDst - xoffSrc) << (5 - PWSH); leftShift = 32 - rightShift; } psrc = psrcLine; pdst = pdstLine; bits = 0; srcRemaining = widthSrc - srcStart; if (xoffSrc > xoffDst) { bits = *psrc; IncSrcPtr } if (startmask) { bits1 = BitLeft(bits,leftShift); bits = *psrc; IncSrcPtr bits1 |= BitRight(bits,rightShift); *pdst = MROP_MASK(bits1, *pdst, startmask); pdst++; } nlTemp = nlMiddle; while (nlTemp) { nl = nlTemp; if (nl > srcRemaining) nl = srcRemaining; nlTemp -= nl; srcRemaining -= nl; #if MROP == Mcopy #ifdef LARGE_INSTRUCTION_CACHE bits1 = bits; #ifdef FAST_CONSTANT_OFFSET_MODE psrc += nl & (UNROLL-1); pdst += nl & (UNROLL-1); #define BodyOdd(n) \ bits = psrc[-n]; \ pdst[-n] = MROP_SOLID(BitLeft(bits1, leftShift) | BitRight(bits, rightShift), pdst[-n]); #define BodyEven(n) \ bits1 = psrc[-n]; \ pdst[-n] = MROP_SOLID(BitLeft(bits, leftShift) | BitRight(bits1, rightShift), pdst[-n]); #define LoopReset \ pdst += UNROLL; \ psrc += UNROLL; #else #define BodyOdd(n) \ bits = *psrc++; \ *pdst = MROP_SOLID(BitLeft(bits1, leftShift) | BitRight(bits, rightShift), *pdst); \ pdst++; #define BodyEven(n) \ bits1 = *psrc++; \ *pdst = MROP_SOLID(BitLeft(bits, leftShift) | BitRight(bits1, rightShift), *pdst); \ pdst++; #define LoopReset ; #endif /* !FAST_CONSTANT_OFFSET_MODE */ PackedLoop #undef BodyOdd #undef BodyEven #undef LoopReset #else DuffL (nl,label2, bits1 = BitLeft(bits, leftShift); bits = *psrc++; *pdst = MROP_SOLID (bits1 | BitRight(bits, rightShift), *pdst); pdst++; ) #endif #else while (nl--) { bits1 = BitLeft(bits,leftShift); bits = *psrc++; *pdst = MROP_SOLID(bits1|BitRight(bits,rightShift), *pdst); pdst++; } #endif if (!srcRemaining) { srcRemaining = widthSrc; psrc = psrcStart; } } if (endmask) { bits1 = BitLeft(bits, leftShift); if (BitLeft(endmask, rightShift)) { bits = *psrc; bits1 |= BitRight(bits, rightShift); } *pdst = MROP_MASK (bits1, *pdst, endmask); } } ppt++; } }