Leaked source code of windows server 2003
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

1307 lines
36 KiB

/******************************Module*Header*******************************\
* Module Name: srcblt24.cxx
*
* This contains the bitmap simulation functions that blt to a 24 bit/pel
* DIB surface.
*
* Created: 07-Feb-1991 19:27:49
* Author: Patrick Haluptzok patrickh
*
* Copyright (c) 1990-1999 Microsoft Corporation
*
\**************************************************************************/
#include "precomp.hxx"
// Turn off validations
#if 1
// On free builds, don't call any verification code:
#define VERIFYS16D24(psb)
#define VERIFYS32D24(psb)
#else
// On checked builds, verify the RGB conversions:
VOID VERIFYS16D24(PBLTINFO psb)
{
// We assume we are doing left to right top to bottom blting
ASSERTGDI(psb->xDir == 1, "vSrcCopyS16D24 - direction not left to right");
ASSERTGDI(psb->yDir == 1, "vSrcCopyS16D24 - direction not up to down");
// These are our holding variables
ULONG ulDst;
PUSHORT pusSrcTemp;
PBYTE pjDstTemp;
ULONG cxTemp;
PUSHORT pusSrc = (PUSHORT) (psb->pjSrc + (2 * psb->xSrcStart));
PBYTE pjDst = psb->pjDst + (psb->xDstStart * 3);
ULONG cx = psb->cx;
ULONG cy = psb->cy;
XLATE *pxlo = psb->pxlo;
ASSERTGDI(cy != 0, "ERROR: Src Move cy == 0");
while(1)
{
pusSrcTemp = pusSrc;
pjDstTemp = pjDst;
cxTemp = cx;
while(cxTemp--)
{
ulDst = pxlo->ulTranslate((ULONG) *(pusSrcTemp++));
if (*(pjDstTemp++) != (BYTE) ulDst)
RIP("RGB mis-match");
if (*(pjDstTemp++) != (BYTE) (ulDst >> 8))
RIP("RGB mis-match");
if (*(pjDstTemp++) != (BYTE) (ulDst >> 16))
RIP("RGB mis-match");
}
if (--cy)
{
pusSrc = (PUSHORT) (((PBYTE) pusSrc) + psb->lDeltaSrc);
pjDst += psb->lDeltaDst;
}
else
break;
}
}
VOID VERIFYS32D24(PBLTINFO psb)
{
// We assume we are doing left to right top to bottom blting
ASSERTGDI(psb->xDir == 1, "vSrcCopyS32D24 - direction not left to right");
ASSERTGDI(psb->yDir == 1, "vSrcCopyS32D24 - direction not up to down");
// These are our holding variables
ULONG ulDst;
PULONG pulSrcTemp;
PBYTE pjDstTemp;
ULONG cxTemp;
PULONG pulSrc = (PULONG) (psb->pjSrc + (4 * psb->xSrcStart));
PBYTE pjDst = psb->pjDst + (psb->xDstStart * 3);
ULONG cx = psb->cx;
ULONG cy = psb->cy;
XLATE *pxlo = psb->pxlo;
ASSERTGDI(cy != 0, "ERROR: Src Move cy == 0");
while(1)
{
pulSrcTemp = pulSrc;
pjDstTemp = pjDst;
cxTemp = cx;
if ((pxlo == NULL) || (pxlo->flXlate & XO_TRIVIAL))
{
while(cxTemp--)
{
ulDst = *(pulSrcTemp++);
if (*(pjDstTemp++) != (BYTE) ulDst)
RIP("RGB mis-match");
if (*(pjDstTemp++) != (BYTE) (ulDst >> 8))
RIP("RGB mis-match");
if (*(pjDstTemp++) != (BYTE) (ulDst >> 16))
RIP("RGB mis-match");
}
}
else
{
while(cxTemp--)
{
ulDst = pxlo->ulTranslate(*(pulSrcTemp++));
if (*(pjDstTemp++) != (BYTE) ulDst)
RIP("RGB mis-match");
if (*(pjDstTemp++) != (BYTE) (ulDst >> 8))
RIP("RGB mis-match");
if (*(pjDstTemp++) != (BYTE) (ulDst >> 16))
RIP("RGB mis-match");
}
}
if (--cy)
{
pulSrc = (PULONG) (((PBYTE) pulSrc) + psb->lDeltaSrc);
pjDst += psb->lDeltaDst;
}
else
break;
}
}
#endif
/*******************Public*Routine*****************\
* vSrcCopyS1D24
*
* There are three main loops in this function.
*
* The first loop deals with the full byte part mapping
* the Dst while fetching/shifting the matching 8 bits
* from the Src.
*
* The second loop deals with the left starting
* pixels.
*
* The third loop deals with the ending pixels.
*
* For the full bytes, we walk thru Src one byte at a time
* and expand to Dst.
*
* We expand the starting/ending pixels one bit
* at a time.
*
* History:
* 17-Oct-1994 -by- Lingyun Wang [lingyunw]
* Wrote it.
\**************************************************/
VOID vSrcCopyS1D24(PBLTINFO psb)
{
// We assume we are doing left to right top to bottom blting
ASSERTGDI(psb->xDir == 1, "vSrcCopyS1D24 - direction not left to right");
ASSERTGDI(psb->yDir == 1, "vSrcCopyS1D24 - direction not up to down");
BYTE jSrc; // holds a source byte
INT iDst; // Position in the first 8 Dst units
INT iSrc; // bit position in the first Src byte
PBYTE pjDst;
PBYTE pjSrc; // pointer to the Dst bytes
LONG xSrcEnd = psb->xSrcEnd;
LONG cy; // number of rows
LONG cx; // number of pixels
BYTE jAlignL; // alignment bits to the left
BYTE jAlignR; // alignment bits to the right
LONG cFullBytes; //number of full 8 bytes dealed with
BOOL bNextByte;
LONG xDstEnd = psb->xDstStart+psb->cx;
LONG lDeltaDst;
LONG lDeltaSrc;
ULONG ulB = (ULONG)(psb->pxlo->pulXlate[0]);
ULONG ulF = (ULONG)(psb->pxlo->pulXlate[1]);
UCHAR aucTable[8];
INT count;
PBYTE pjTable;
BOOL bNextSrc=TRUE;
ASSERTGDI(psb->cy != 0, "ERROR: Src Move cy == 0");
//DbgPrint ("vsrccopys1d24\n");
// Generate ulTable. 2 entries.
ULONG ulValB = ulB;
ULONG ulValF = ulF;
*(PULONG) aucTable = ulValB;
*(PULONG) (aucTable+4) = ulValF;
//Get Src and Dst start positions
iSrc = psb->xSrcStart & 0x0007;
iDst = psb->xDstStart & 0x0007;
if (iSrc < iDst)
jAlignL = 8 - (iDst - iSrc);
// If Dst starting point is ahead of Src
else
jAlignL = iSrc - iDst;
jAlignR = 8 - jAlignL;
cx=psb->cx;
lDeltaDst = psb->lDeltaDst;
lDeltaSrc = psb->lDeltaSrc;
// if there is a next 8 dwords
bNextByte = !((xDstEnd>>3) ==
(psb->xDstStart>>3));
// if Src and Dst are aligned, use a separete loop
// to obtain better performance;
// If not, we shift the Src bytes to match with
// the Dst - 1 bit expand to 3 bytes
if (bNextByte)
{
long iStrideSrc;
long iStrideDst;
PBYTE pjSrcEnd;
// Get first Dst full 8 dwords
pjDst = psb->pjDst + 3*((psb->xDstStart+7)&~0x07);
// Get the Src byte that matches the first Dst
// full 8 bytes
pjSrc = psb->pjSrc + ((psb->xSrcStart+((8-iDst)&0x07)) >> 3);
//Get the number of full bytes to expand
cFullBytes = (xDstEnd>>3)-((psb->xDstStart+7)>>3);
//the increment to the full byte on the next scan line
iStrideDst = lDeltaDst - cFullBytes*8*3;
iStrideSrc = lDeltaSrc - cFullBytes;
// deal with our special case
cy = psb->cy;
if (!jAlignL)
{
while (cy--)
{
pjSrcEnd = pjSrc + cFullBytes;
while (pjSrc != pjSrcEnd)
{
jSrc = *pjSrc++;
pjTable = aucTable + ((jSrc & 0x80) >> (7-2));
*(pjDst + 0) = *pjTable;
*(pjDst + 1) = *(pjTable+1);
*(pjDst + 2) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x40) >> (6-2));
*(pjDst + 3) = *pjTable;
*(pjDst + 4) = *(pjTable+1);
*(pjDst + 5) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x20) >> (5-2));
*(pjDst + 6) = *pjTable;
*(pjDst + 7) = *(pjTable+1);
*(pjDst + 8) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x10) >> (4-2));
*(pjDst + 9) = *pjTable;
*(pjDst + 10) = *(pjTable+1);
*(pjDst + 11) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x08) >> (3-2));
*(pjDst + 12) = *pjTable;
*(pjDst + 13) = *(pjTable+1);
*(pjDst + 14) = *(pjTable+2);
pjTable = aucTable + (jSrc & 0x04);
*(pjDst + 15) = *pjTable;
*(pjDst + 16) = *(pjTable+1);
*(pjDst + 17) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x02) << 1);
*(pjDst + 18) = *pjTable;
*(pjDst + 19) = *(pjTable+1);
*(pjDst + 20) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x01) << 2);
*(pjDst + 21) = *pjTable;
*(pjDst + 22) = *(pjTable+1);
*(pjDst + 23) = *(pjTable+2);
pjDst +=3*8;
}
pjDst += iStrideDst;
pjSrc += iStrideSrc;
}
} //end of if (!jAlignL)
else // if not aligned
// Here comes our general case for the main full
// bytes part
{
BYTE jRem; //remainder
while (cy--)
{
jRem = *pjSrc << jAlignL;
pjSrcEnd = pjSrc + cFullBytes;
while (pjSrc != pjSrcEnd)
{
jSrc = ((*(++pjSrc))>>jAlignR) | jRem;
pjTable = aucTable + ((jSrc & 0x80) >> (7-2));
*(pjDst + 0) = *pjTable;
*(pjDst + 1) = *(pjTable+1);
*(pjDst + 2) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x40) >> (6-2));
*(pjDst + 3) = *pjTable;
*(pjDst + 4) = *(pjTable+1);
*(pjDst + 5) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x20) >> (5-2));
*(pjDst + 6) = *pjTable;
*(pjDst + 7) = *(pjTable+1);
*(pjDst + 8) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x10) >> (4-2));
*(pjDst + 9) = *pjTable;
*(pjDst + 10) = *(pjTable+1);
*(pjDst + 11) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x08) >> (3-2));
*(pjDst + 12) = *pjTable;
*(pjDst + 13) = *(pjTable+1);
*(pjDst + 14) = *(pjTable+2);
pjTable = aucTable + (jSrc & 0x04);
*(pjDst + 15) = *pjTable;
*(pjDst + 16) = *(pjTable+1);
*(pjDst + 17) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x02) << 1);
*(pjDst + 18) = *pjTable;
*(pjDst + 19) = *(pjTable+1);
*(pjDst + 20) = *(pjTable+2);
pjTable = aucTable + ((jSrc & 0x01) << 2);
*(pjDst + 21) = *pjTable;
*(pjDst + 22) = *(pjTable+1);
*(pjDst + 23) = *(pjTable+2);
pjDst +=3*8;
//next remainder
jRem = *pjSrc << jAlignL;
}
// go to the beginging full byte of
// next scan line
pjDst += iStrideDst;
pjSrc += iStrideSrc;
}
} //else
} //if
// End of our dealing with the full bytes
// Begin dealing with the left strip of the
// starting pixels
if (!bNextByte)
{
count = cx;
bNextSrc = ((iSrc+cx) > 8);
}
else
count = 8-iDst;
if (iDst | !bNextByte)
{
PBYTE pjDstTemp;
PBYTE pjDstEnd;
pjDst = psb->pjDst + 3*psb->xDstStart;
pjSrc = psb->pjSrc + (psb->xSrcStart>>3);
cy = psb->cy;
if (iSrc > iDst)
{
if (bNextSrc)
{
while (cy--)
{
jSrc = *pjSrc << jAlignL;
jSrc |= *(pjSrc+1) >> jAlignR;
jSrc <<= iDst;
pjDstTemp = pjDst;
pjDstEnd = pjDst + 3*count;
while (pjDstTemp != pjDstEnd)
{
pjTable = aucTable + ((jSrc & 0x80) >> (7-2));
*(pjDstTemp + 0) = *pjTable;
*(pjDstTemp + 1) = *(pjTable+1);
*(pjDstTemp + 2) = *(pjTable+2);
jSrc <<= 1;
pjDstTemp += 3;
}
pjDst += lDeltaDst;
pjSrc += lDeltaSrc;
}
}
else
{
while (cy--)
{
jSrc = *pjSrc << jAlignL;
jSrc <<= iDst;
pjDstTemp = pjDst;
pjDstEnd = pjDst + 3*count;
while (pjDstTemp != pjDstEnd)
{
pjTable = aucTable + ((jSrc & 0x80) >> (7-2));
*(pjDstTemp + 0) = *pjTable;
*(pjDstTemp + 1) = *(pjTable+1);
*(pjDstTemp + 2) = *(pjTable+2);
jSrc <<= 1;
pjDstTemp += 3;
}
pjDst += lDeltaDst;
pjSrc += lDeltaSrc;
}
}
}
else //if (iSrc <= iDst)
{
while (cy--)
{
jSrc = *pjSrc << iSrc;
pjDstTemp = pjDst;
pjDstEnd = pjDst + 3*count;
while (pjDstTemp != pjDstEnd)
{
pjTable = aucTable + ((jSrc & 0x80) >> (7-2));
*(pjDstTemp + 0) = *pjTable;
*(pjDstTemp + 1) = *(pjTable+1);
*(pjDstTemp + 2) = *(pjTable+2);
jSrc <<= 1;
pjDstTemp += 3;
}
pjDst += lDeltaDst;
pjSrc += lDeltaSrc;
}
}
} //if
// Begin dealing with the right edge
// of partial 8 bytes
// first check if there is any partial
// byte left
// and has next 8 bytes
if ((xDstEnd & 0x0007)
&& bNextByte)
{
PBYTE pjDstTemp;
PBYTE pjDstEnd;
// Get the last partial bytes on the
// scan line
pjDst = psb->pjDst+ 3*(xDstEnd&~0x07);
// Get the Src byte that matches the
// right partial Dst 8 bytes
pjSrc = psb->pjSrc + ((psb->xSrcEnd-1) >>3);
// Get the ending position in the last
// Src and Dst bytes
iSrc = (psb->xSrcEnd-1) & 0x0007;
iDst = (xDstEnd-1) & 0x0007;
count = iDst+1;
cy = psb->cy;
if (iSrc >= iDst)
{
while (cy--)
{
jSrc = *pjSrc << jAlignL;
pjDstTemp = pjDst;
pjDstEnd = pjDst + 3*count;
while (pjDstTemp != pjDstEnd)
{
pjTable = aucTable + ((jSrc & 0x80) >> (7-2));
*(pjDstTemp + 0) = *pjTable;
*(pjDstTemp + 1) = *(pjTable+1);
*(pjDstTemp + 2) = *(pjTable+2);
jSrc <<= 1;
pjDstTemp += 3;
}
pjDst += lDeltaDst;
pjSrc += lDeltaSrc;
}
}
else //if (iSrc < iDst)
{
while (cy--)
{
jSrc = *(pjSrc-1) << jAlignL;
jSrc |= *pjSrc >> jAlignR;
pjDstTemp = pjDst;
pjDstEnd = pjDst + 3*count;
while (pjDstTemp != pjDstEnd)
{
pjTable = aucTable + ((jSrc & 0x80) >> (7-2));
*(pjDstTemp + 0) = *pjTable;
*(pjDstTemp + 1) = *(pjTable+1);
*(pjDstTemp + 2) = *(pjTable+2);
jSrc <<= 1;
pjDstTemp += 3;
}
pjDst += lDeltaDst;
pjSrc += lDeltaSrc;
}
}
} //if
}
/******************************Public*Routine******************************\
* vSrcCopyS4D24
*
*
* History:
* 18-Feb-1991 -by- Patrick Haluptzok patrickh
* Wrote it.
\**************************************************************************/
VOID vSrcCopyS4D24(PBLTINFO psb)
{
// We assume we are doing left to right top to bottom blting.
// If it was on the same surface we would be doing the identity case.
ASSERTGDI(psb->xDir == 1, "vSrcCopyS8D24 - direction not left to right");
ASSERTGDI(psb->yDir == 1, "vSrcCopyS8D24 - direction not up to down");
// These are our holding variables
#if MESSAGE_BLT
DbgPrint("Now entering vSrcCopyS8D24\n");
#endif
PBYTE pjSrc = psb->pjSrc + (psb->xSrcStart >> 1);
PBYTE pjDst = psb->pjDst + (psb->xDstStart * 3);
ULONG cx = psb->cx;
ULONG cy = psb->cy;
PULONG pulXlate = psb->pxlo->pulXlate;
PBYTE pjDstTemp;
PBYTE pjSrcTemp;
ULONG cStartPixels;
ULONG cMiddlePixels;
ULONG cEndPixels;
ULONG i,j;
ULONG ul;
ULONG ul0, ul1,ul2,ul3;
ASSERTGDI(cy != 0, "ERROR: Src Move cy == 0");
// 'cStartPixels' is the minimum number of 3-byte pixels we'll have to
// write before we have dword alignment on the destination:
cStartPixels = (ULONG)((ULONG_PTR) pjDst) & 3;
if (cStartPixels > cx)
{
cStartPixels = cx;
}
cx -= cStartPixels;
cMiddlePixels = cx >> 2;
cEndPixels = cx & 3;
while(1)
{
// Write pixels a byte at a time until we're 'dword' aligned on
// the destination:
j = psb->xSrcStart;
pjDstTemp = pjDst;
pjSrcTemp = pjSrc;
for (i = cStartPixels; i != 0; i--)
{
if (j & 0x00000001)
{
ul = pulXlate[*pjSrcTemp & 0x0F];
pjSrcTemp++;
}
else
{
ul = pulXlate[(((ULONG) (*pjSrcTemp & 0xF0)) >> 4)];
}
*(pjDstTemp) = (BYTE) ul;
*(pjDstTemp + 1) = (BYTE) (ul >> 8);
*(pjDstTemp + 2) = (BYTE) (ul >> 16);
j++;
pjDstTemp += 3;
}
//
// grab 4 pixles at a time
//
for (i = cMiddlePixels; i != 0; i--)
{
if (j & 0x00000001)
{
ul0 = pulXlate[(*pjSrcTemp & 0x0F)];
pjSrcTemp++;
ul1 = pulXlate[(((ULONG) (*pjSrcTemp & 0xF0)) >> 4)];
ul2 = pulXlate[((ULONG) (*pjSrcTemp & 0x0F))];
pjSrcTemp++;
ul3 = pulXlate[((ULONG) (*pjSrcTemp & 0xF0)) >> 4];
}
else
{
ul0 = pulXlate[(((ULONG) (*pjSrcTemp & 0xF0)) >> 4)];
ul1 = pulXlate[((ULONG) (*pjSrcTemp & 0x0F))];
pjSrcTemp++;
ul2 = pulXlate[(((ULONG) (*pjSrcTemp & 0xF0)) >> 4)];
ul3 = pulXlate[((ULONG) (*pjSrcTemp & 0x0F))];
pjSrcTemp++;
}
*((ULONG*) (pjDstTemp)) = ul0 | (ul1 << 24);
*((ULONG*) (pjDstTemp + 4)) = (ul1 >> 8) | (ul2 << 16);
*((ULONG*) (pjDstTemp + 8)) = (ul3 << 8) | (ul2 >> 16);
j += 4;
pjDstTemp += 12;
}
// Take care of the end alignment:
for (i = cEndPixels; i != 0; i--)
{
if (j & 0x00000001)
{
ul = pulXlate[*pjSrcTemp & 0x0F];
pjSrcTemp++;
}
else
{
ul = pulXlate[(((ULONG) (*pjSrcTemp & 0xF0)) >> 4)];
}
*(pjDstTemp) = (BYTE) ul;
*(pjDstTemp + 1) = (BYTE) (ul >> 8);
*(pjDstTemp + 2) = (BYTE) (ul >> 16);
j++;
pjDstTemp += 3;
}
if (--cy == 0)
break;
pjSrc += psb->lDeltaSrc;
pjDst += psb->lDeltaDst;
}
}
/******************************Public*Routine******************************\
* vSrcCopyS8D24
*
*
* History:
* 18-Feb-1991 -by- Patrick Haluptzok patrickh
* Wrote it.
\**************************************************************************/
VOID vSrcCopyS8D24(PBLTINFO psb)
{
// We assume we are doing left to right top to bottom blting.
// If it was on the same surface we would be doing the identity case.
ASSERTGDI(psb->xDir == 1, "vSrcCopyS8D24 - direction not left to right");
ASSERTGDI(psb->yDir == 1, "vSrcCopyS8D24 - direction not up to down");
// These are our holding variables
#if MESSAGE_BLT
DbgPrint("Now entering vSrcCopyS8D24\n");
#endif
PBYTE pjSrc = psb->pjSrc + psb->xSrcStart;
PBYTE pjDst = psb->pjDst + (psb->xDstStart * 3);
ULONG cx = psb->cx;
ULONG cy = psb->cy;
PULONG pulXlate = psb->pxlo->pulXlate;
LONG lSrcSkip = psb->lDeltaSrc - cx;
LONG lDstSkip = psb->lDeltaDst - (cx * 3);
ULONG cStartPixels;
ULONG cMiddlePixels;
ULONG cEndPixels;
ULONG i;
ULONG ul;
ULONG ul0;
ULONG ul1;
ASSERTGDI(cy != 0, "ERROR: Src Move cy == 0");
// 'cStartPixels' is the minimum number of 3-byte pixels we'll have to
// write before we have dword alignment on the destination:
cStartPixels = (ULONG)((ULONG_PTR) pjDst) & 3;
if (cStartPixels > cx)
{
cStartPixels = cx;
}
cx -= cStartPixels;
cMiddlePixels = cx >> 2;
cEndPixels = cx & 3;
while(1)
{
// Write pixels a byte at a time until we're 'dword' aligned on
// the destination:
for (i = cStartPixels; i != 0; i--)
{
ul = pulXlate[*pjSrc];
*(pjDst) = (BYTE) ul;
*(pjDst + 1) = (BYTE) (ul >> 8);
*(pjDst + 2) = (BYTE) (ul >> 16);
pjSrc += 1;
pjDst += 3;
}
// Now write pixels a dword at a time. This is almost a 4x win
// over doing byte writes if we're writing to frame buffer memory
// over the PCI bus on Pentium class systems, because the PCI
// write throughput is so slow:
for (i = cMiddlePixels; i != 0; i--)
{
ul0 = (pulXlate[*(pjSrc)]);
ul1 = (pulXlate[*(pjSrc + 1)]);
*((ULONG*) (pjDst)) = ul0 | (ul1 << 24);
ul0 = (pulXlate[*(pjSrc + 2)]);
*((ULONG*) (pjDst + 4)) = (ul1 >> 8) | (ul0 << 16);
ul1 = (pulXlate[*(pjSrc + 3)]);
*((ULONG*) (pjDst + 8)) = (ul1 << 8) | (ul0 >> 16);
pjSrc += 4;
pjDst += 12;
}
// Take care of the end alignment:
for (i = cEndPixels; i != 0; i--)
{
ul = pulXlate[*pjSrc];
*(pjDst) = (BYTE) ul;
*(pjDst + 1) = (BYTE) (ul >> 8);
*(pjDst + 2) = (BYTE) (ul >> 16);
pjSrc += 1;
pjDst += 3;
}
if (--cy == 0)
break;
pjSrc += lSrcSkip;
pjDst += lDstSkip;
}
}
/******************************Public*Routine******************************\
* vSrcCopyS16D24
*
*
* History:
* 07-Feb-1991 -by- Patrick Haluptzok patrickh
* Wrote it.
\**************************************************************************/
VOID vSrcCopyS16D24(PBLTINFO psb)
{
// We assume we are doing left to right top to bottom blting
ASSERTGDI(psb->xDir == 1, "vSrcCopyS16D24 - direction not left to right");
ASSERTGDI(psb->yDir == 1, "vSrcCopyS16D24 - direction not up to down");
// These are our holding variables
PBYTE pjSrc = psb->pjSrc + (2 * psb->xSrcStart);
PBYTE pjDst = psb->pjDst + (3 * psb->xDstStart);
ULONG cx = psb->cx;
ULONG cy = psb->cy;
XLATE *pxlo = psb->pxlo;
LONG lSrcSkip = psb->lDeltaSrc - (cx * 2);
LONG lDstSkip = psb->lDeltaDst - (cx * 3);
PFN_pfnXlate pfnXlate = pxlo->pfnXlateBetweenBitfields();
ULONG cStartPixels;
ULONG cMiddlePixels;
ULONG cEndPixels;
ULONG ul;
ULONG ul0;
ULONG ul1;
LONG i;
ASSERTGDI(cy != 0, "ERROR: Src Move cy == 0");
// 'cStartPixels' is the minimum number of 3-byte pixels we'll have to
// write before we have dword alignment on the destination:
cStartPixels = (ULONG)((ULONG_PTR) pjDst) & 3;
if (cStartPixels > cx)
{
cStartPixels = cx;
}
cx -= cStartPixels;
cMiddlePixels = cx >> 2;
cEndPixels = cx & 3;
while (1)
{
for (i = cStartPixels; i != 0; i--)
{
ul = pfnXlate(pxlo, *((USHORT*) pjSrc));
*(pjDst) = (BYTE) (ul);
*(pjDst + 1) = (BYTE) (ul >> 8);
*(pjDst + 2) = (BYTE) (ul >> 16);
pjSrc += 2;
pjDst += 3;
}
for (i = cMiddlePixels; i != 0; i--)
{
ul0 = pfnXlate(pxlo, *((USHORT*) (pjSrc)));
ul1 = pfnXlate(pxlo, *((USHORT*) (pjSrc + 2)));
*((ULONG*) (pjDst)) = ul0 | (ul1 << 24);
ul0 = pfnXlate(pxlo, *((USHORT*) (pjSrc + 4)));
*((ULONG*) (pjDst + 4)) = (ul1 >> 8) | (ul0 << 16);
ul1 = pfnXlate(pxlo, *((USHORT*) (pjSrc + 6)));
*((ULONG*) (pjDst + 8)) = (ul1 << 8) | (ul0 >> 16);
pjSrc += 8;
pjDst += 12;
}
for (i = cEndPixels; i != 0; i--)
{
ul = pfnXlate(pxlo, *((USHORT*) pjSrc));
*(pjDst) = (BYTE) (ul);
*(pjDst + 1) = (BYTE) (ul >> 8);
*(pjDst + 2) = (BYTE) (ul >> 16);
pjSrc += 2;
pjDst += 3;
}
if (--cy == 0)
break;
pjSrc += lSrcSkip;
pjDst += lDstSkip;
}
VERIFYS16D24(psb);
}
/******************************Public*Routine******************************\
* vSrcCopyS24D24
*
*
* History:
* 18-Feb-1991 -by- Patrick Haluptzok patrickh
* Wrote it.
\**************************************************************************/
VOID vSrcCopyS24D24(PBLTINFO psb)
{
// We assume we are doing left to right top to bottom blting
ASSERTGDI(psb->xDir == 1, "vSrcCopyS24D24 - direction not left to right");
ASSERTGDI(psb->yDir == 1, "vSrcCopyS24D24 - direction not up to down");
// These are our holding variables
#if MESSAGE_BLT
DbgPrint("Now entering vSrcCopyS8D24\n");
#endif
PBYTE pjSrcTemp;
PBYTE pjDstTemp;
PBYTE pjSrc = psb->pjSrc + (psb->xSrcStart * 3);
PBYTE pjDst = psb->pjDst + (psb->xDstStart * 3);
ULONG cx = psb->cx;
ULONG cy = psb->cy;
XLATE *pxlo = psb->pxlo;
ULONG cStartPixels;
ULONG cMiddlePixels;
ULONG cEndPixels;
ULONG i,j;
ULONG ul;
ULONG ul0,ul1,ul2,ul3;
ASSERTGDI(cy != 0, "ERROR: Src Move cy == 0");
// 'cStartPixels' is the minimum number of 3-byte pixels we'll have to
// write before we have dword alignment on the destination:
cStartPixels = (ULONG)((ULONG_PTR) pjDst) & 3;
if (cStartPixels > cx)
{
cStartPixels = cx;
}
cx -= cStartPixels;
cMiddlePixels = cx >> 2;
cEndPixels = cx & 3;
while(1)
{
// Write pixels a byte at a time until we're 'dword' aligned on
// the destination:
j = psb->xSrcStart;
pjDstTemp = pjDst;
pjSrcTemp = pjSrc;
for (i = cStartPixels; i != 0; i--)
{
ul = (ULONG) *(pjSrcTemp + 2);
ul = ul << 8;
ul |= (ULONG) *(pjSrcTemp + 1);
ul = ul << 8;
ul |= (ULONG) *pjSrcTemp;
ul = pxlo->ulTranslate(ul);
*(pjDstTemp++) = (BYTE) ul;
*(pjDstTemp++) = (BYTE) (ul >> 8);
*(pjDstTemp++) = (BYTE) (ul >> 16);
pjSrcTemp += 3;
}
//
// grab 4 pixles at a time
//
for (i = cMiddlePixels; i != 0; i--)
{
ul0 = (ULONG) *(pjSrcTemp + 2);
ul0 = ul0 << 8;
ul0 |= (ULONG) *(pjSrcTemp + 1);
ul0 = ul0 << 8;
ul0 |= (ULONG) *pjSrcTemp;
ul0 = pxlo->ulTranslate(ul0);
pjSrcTemp += 3;
ul1 = (ULONG) *(pjSrcTemp + 2);
ul1 = ul1 << 8;
ul1 |= (ULONG) *(pjSrcTemp + 1);
ul1 = ul1 << 8;
ul1 |= (ULONG) *pjSrcTemp;
ul1 = pxlo->ulTranslate(ul1);
pjSrcTemp += 3;
ul2 = (ULONG) *(pjSrcTemp + 2);
ul2 = ul2 << 8;
ul2 |= (ULONG) *(pjSrcTemp + 1);
ul2 = ul2 << 8;
ul2 |= (ULONG) *pjSrcTemp;
ul2 = pxlo->ulTranslate(ul2);
pjSrcTemp += 3;
ul3 = (ULONG) *(pjSrcTemp + 2);
ul3 = ul3 << 8;
ul3 |= (ULONG) *(pjSrcTemp + 1);
ul3 = ul3 << 8;
ul3 |= (ULONG) *pjSrcTemp;
ul3 = pxlo->ulTranslate(ul3);
pjSrcTemp += 3;
*((ULONG*) (pjDstTemp)) = ul0 | (ul1 << 24);
*((ULONG*) (pjDstTemp + 4)) = (ul1 >> 8) | (ul2 << 16);
*((ULONG*) (pjDstTemp + 8)) = (ul3 << 8) | (ul2 >> 16);
pjDstTemp += 12;
}
// Take care of the end alignment:
for (i = cEndPixels; i != 0; i--)
{
ul = (ULONG) *(pjSrcTemp + 2);
ul = ul << 8;
ul |= (ULONG) *(pjSrcTemp + 1);
ul = ul << 8;
ul |= (ULONG) *pjSrcTemp;
ul = pxlo->ulTranslate(ul);
*(pjDstTemp++) = (BYTE) ul;
*(pjDstTemp++) = (BYTE) (ul >> 8);
*(pjDstTemp++) = (BYTE) (ul >> 16);
pjSrcTemp += 3;
}
if (--cy == 0)
break;
pjSrc += psb->lDeltaSrc;
pjDst += psb->lDeltaDst;
}
}
/******************************Public*Routine******************************\
* vSrcCopyS24D24Identity
*
* This is the special case no translate blting. All the SmDn should have
* them if m==n. Identity xlates only occur amoung matching format bitmaps
* and screens.
*
* History:
* 18-Feb-1991 -by- Patrick Haluptzok patrickh
* Wrote it.
\**************************************************************************/
VOID vSrcCopyS24D24Identity(PBLTINFO psb)
{
PBYTE pjSrc = psb->pjSrc + (psb->xSrcStart * 3);
PBYTE pjDst = psb->pjDst + (psb->xDstStart * 3);
ULONG cx = psb->cx * 3;
ULONG cy = psb->cy;
ASSERTGDI(cy != 0, "ERROR: Src Move cy == 0");
#if MESSAGE_BLT
DbgPrint("xdir: %ld cy: %lu xSrcStart %lu xDstStart %lu xSrcEnd %lu cx %lu\n",
psb->xDir, cy, psb->xSrcStart, psb->xDstStart, psb->xSrcEnd, cx);
#endif
if (psb->xDir < 0)
{
pjSrc -= (cx - 3);
pjDst -= (cx - 3);
}
while(1)
{
if(psb->fSrcAlignedRd)
vSrcAlignCopyMemory(pjDst, pjSrc, cx);
else
RtlMoveMemory((PVOID)pjDst, (PVOID)pjSrc, cx);
if (--cy)
{
pjSrc += psb->lDeltaSrc;
pjDst += psb->lDeltaDst;
}
else
break;
}
}
/******************************Public*Routine******************************\
* vSrcCopyS32D24
*
*
* History:
* 07-Feb-1991 -by- Patrick Haluptzok patrickh
* Wrote it.
\**************************************************************************/
VOID vSrcCopyS32D24(PBLTINFO psb)
{
// We assume we are doing left to right top to bottom blting
ASSERTGDI(psb->xDir == 1, "vSrcCopyS32D24 - direction not left to right");
ASSERTGDI(psb->yDir == 1, "vSrcCopyS32D24 - direction not up to down");
// These are our holding variables
PBYTE pjSrc = psb->pjSrc + (4 * psb->xSrcStart);
PBYTE pjDst = psb->pjDst + (3 * psb->xDstStart);
ULONG cx = psb->cx;
ULONG cy = psb->cy;
XLATE *pxlo = psb->pxlo;
XEPALOBJ palSrc(pxlo->ppalSrc);
XEPALOBJ palDst(pxlo->ppalDst);
LONG lSrcSkip = psb->lDeltaSrc - (cx * 4);
LONG lDstSkip = psb->lDeltaDst - (cx * 3);
PFN_pfnXlate pfnXlate;
ULONG cStartPixels;
ULONG cMiddlePixels;
ULONG cEndPixels;
ULONG ul;
ULONG ul0;
ULONG ul1;
LONG i;
ASSERTGDI(cy != 0, "ERROR: Src Move cy == 0");
if (palSrc.bIsBGR() && palDst.bIsBGR())
{
// 'cStartPixels' is the minimum number of 3-byte pixels we'll have to
// write before we have dword alignment on the destination:
cStartPixels = (ULONG)((ULONG_PTR) pjDst) & 3;
if (cStartPixels > cx)
{
cStartPixels = cx;
}
cx -= cStartPixels;
cMiddlePixels = cx >> 2;
cEndPixels = cx & 3;
while (1)
{
for (i = cStartPixels; i != 0; i--)
{
*(pjDst) = *(pjSrc);
*(pjDst + 1) = *(pjSrc + 1);
*(pjDst + 2) = *(pjSrc + 2);
pjSrc += 4;
pjDst += 3;
}
for (i = cMiddlePixels; i != 0; i--)
{
ul0 = *((ULONG *) (pjSrc));
ul1 = *((ULONG *) (pjSrc + 4));
*((ULONG*) (pjDst)) = (ul0 & 0xffffff) | (ul1 << 24);
ul0 = *((ULONG *) (pjSrc + 8));
*((ULONG*) (pjDst + 4)) = ((ul1 >> 8) & 0xffff) | (ul0 << 16);
ul1 = *((ULONG *) (pjSrc + 12));
*((ULONG*) (pjDst + 8)) = (ul1 << 8) | ((ul0 >> 16) & 0xff);
pjSrc += 16;
pjDst += 12;
}
for (i = cEndPixels; i != 0; i--)
{
*(pjDst) = *(pjSrc);
*(pjDst + 1) = *(pjSrc + 1);
*(pjDst + 2) = *(pjSrc + 2);
pjSrc += 4;
pjDst += 3;
}
if (--cy == 0)
break;
pjSrc += lSrcSkip;
pjDst += lDstSkip;
}
VERIFYS32D24(psb);
return;
}
pfnXlate = pxlo->pfnXlateBetweenBitfields();
while (1)
{
i = cx;
do {
ul = pfnXlate(pxlo, *((ULONG*) pjSrc));
*(pjDst) = (BYTE) (ul);
*(pjDst + 1) = (BYTE) (ul >> 8);
*(pjDst + 2) = (BYTE) (ul >> 16);
pjSrc += 4;
pjDst += 3;
} while (--i != 0);
if (--cy == 0)
break;
pjSrc += lSrcSkip;
pjDst += lDstSkip;
}
VERIFYS32D24(psb);
}