You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
5549 lines
188 KiB
5549 lines
188 KiB
/******************************************************************************\
|
|
*
|
|
* Copyright (c) 1996-1997 Microsoft Corporation.
|
|
* Copyright (c) 1996-1997 Cirrus Logic, Inc.
|
|
*
|
|
* Module Name:
|
|
*
|
|
* D D R A W . C
|
|
*
|
|
*
|
|
* Implements all the DirectDraw components for the driver.
|
|
*
|
|
*
|
|
* $Log: S:/projects/drivers/ntsrc/display/ddraw.c_v $
|
|
*
|
|
* Rev 1.14 07 Apr 1997 11:37:02 PLCHU
|
|
*
|
|
*
|
|
* Rev 1.13 Apr 03 1997 15:38:44 unknown
|
|
*
|
|
*
|
|
*
|
|
* Rev 1.10 Jan 14 1997 15:15:12 unknown
|
|
* Add new double clock detecting method.
|
|
*
|
|
* Rev 1.8 Jan 08 1997 11:23:34 unknown
|
|
* Add 2x clock support and double scan line counter support
|
|
*
|
|
* Rev 1.7 Dec 17 1996 18:31:12 unknown
|
|
* Update the bandwidth equation again.
|
|
*
|
|
* Rev 1.6 Dec 13 1996 12:15:04 unknown
|
|
* update bandwith equation.
|
|
*
|
|
* Rev 1.5 Dec 12 1996 11:09:52 unknown
|
|
* Add double scan line counter support
|
|
*
|
|
* Rev 1.5 Dec 12 1996 11:02:12 unknown
|
|
* Add double scan line counter support.
|
|
*
|
|
* Rev 1.5 Nov 26 1996 14:29:58 unknown
|
|
* Turn off the video window before the moving and then turn it on.
|
|
*
|
|
* Rev 1.4 Nov 25 1996 14:39:32 unknown
|
|
* Fixed AVI file playback and 16bpp transparent Blt bugs.
|
|
*
|
|
* Rev 1.4 Nov 18 1996 13:58:58 JACKIEC
|
|
*
|
|
*
|
|
* Rev 1.3 Nov 07 1996 16:47:56 unknown
|
|
*
|
|
*
|
|
* Rev 1.2 Oct 16 1996 14:41:04 unknown
|
|
* NT 3.51 does not have DDRAW support, So turn off overlay.h in NT 3.51
|
|
*
|
|
* Rev 1.1 Oct 10 1996 15:36:28 unknown
|
|
*
|
|
*
|
|
* Rev 1.10 12 Aug 1996 16:51:04 frido
|
|
* Added NT 3.5x/4.0 auto detection.
|
|
*
|
|
* Rev 1.9 06 Aug 1996 18:37:12 frido
|
|
* DirectDraw works! Video mapping is the key!
|
|
*
|
|
* Rev 1.8 24 Jul 1996 14:38:44 frido
|
|
* Cleaned up font cache after DirectDraw is done.
|
|
*
|
|
* Rev 1.7 24 Jul 1996 14:30:04 frido
|
|
* Added a call to destroy all cached fonts to make more room.
|
|
*
|
|
* Rev 1.6 20 Jul 1996 00:00:44 frido
|
|
* Fixed filling of DirectDraw in 24-bpp.
|
|
* Changed off-screen alignment to 4 bytes.
|
|
* Added compile switch to manage DirectDraw support in 24-bpp.
|
|
*
|
|
* Rev 1.5 16 Jul 1996 18:55:22 frido
|
|
* Fixed DirectDraw in 24-bpp mode.
|
|
*
|
|
* Rev 1.4 15 Jul 1996 18:03:22 frido
|
|
* Changed CP_MM_DST_ADDR to CP_MM_DST_ADDR_ABS.
|
|
*
|
|
* Rev 1.3 15 Jul 1996 10:58:28 frido
|
|
* Changed back to S3 base.
|
|
*
|
|
* Rev 1.1 09 Jul 1996 14:52:30 frido
|
|
* Only support chips 5436 and 5446.
|
|
*
|
|
* Rev 1.0 03 Jul 1996 13:53:02 frido
|
|
* Ported from S3 DirectDraw code.
|
|
*
|
|
* jl01 10-08-96 Do Transparent BLT w/o Solid Fill. Refer to PDRs#5511/6817.
|
|
*
|
|
* chu01 11-17-96 For 24-bpp, aligned destination boundary/size values are
|
|
* wrong. Refer to PDR#7312.
|
|
*
|
|
* sge01 11-19-96 Write CR37 at last For 5480.
|
|
*
|
|
*
|
|
* sge02 11-21-96 We have to set the Color Expand Width even in
|
|
* non-expand transparency mode.
|
|
*
|
|
*
|
|
* sge03 12-04-96 Add double scan line counter support .
|
|
*
|
|
* sge04 12-13-96 Change bandwidth for 5446BE and later chips.
|
|
*
|
|
* sge05 01-07-97 Use dword align for double clock mode.
|
|
*
|
|
* chu02 01-08-97 Disable ActiveX/Active Movie Player for interlaced modes.
|
|
* Refer to PDR#7312, 7866.
|
|
*
|
|
* jc01 10-18-96 Port Microsoft recent change.
|
|
* tao1 10-21-96 Added direct draw support for CL-GD7555.
|
|
* myf21 11-21-96 Change CAPS_IS_7555 to check ppdev->ulChipID
|
|
*
|
|
* sge06 01-27-97 Extend VCLK Denominator to 7 bits from 5 bits.
|
|
* sge07 02-13-97 Use replication when in 1280x1024x8 mode.
|
|
* myf31 02-24-97 Fixed enable HW Video, panning scrolling enable,screen move
|
|
* video window have follow moving
|
|
* chu03 03-26-97 Bandwidth eqution for the CL-GD5480.
|
|
* myf33 :03-31-97 : Fixed PDR #8709, read true VCLK in getVCLK()
|
|
* & panning scrolling enable, support HW Video
|
|
* chu04 04-02-97 No matterwhat color depth is, always turn on COLORKEY and
|
|
* SRCBLT in the DD/DD colorkey capabilities for the 5480.
|
|
*
|
|
\******************************************************************************/
|
|
|
|
#include "PreComp.h"
|
|
#if DIRECTDRAW
|
|
#include "overlay.h"
|
|
|
|
LONG MIN_OLAY_WIDTH = 4;
|
|
|
|
//#define ONLY54x6 // Comment this line out if DirectDraw should be 'generic'
|
|
|
|
// The next flag controls DirectDraw support in 24-bpp.
|
|
#define DIRECTX_24 2 // 0 - no support
|
|
// 1 - blt support, no heap (flip)
|
|
// 2 - full support
|
|
|
|
//
|
|
// Some handy macros.
|
|
//
|
|
#define BLT_BUSY(ppdev, pjBase) (CP_MM_ACL_STAT(ppdev, pjBase) & 0x01)
|
|
#ifdef ONLY54x6
|
|
#define BLT_READY(ppdev, pjBase) (!(CP_MM_ACL_STAT(ppdev, pjBase) & 0x10))
|
|
#else
|
|
#define BLT_READY(ppdev, pjBase) (!(CP_MM_ACL_STAT(ppdev, pjBase) & \
|
|
((ppdev->flCaps & CAPS_AUTOSTART) ? 0x10 : 0x01)))
|
|
#endif
|
|
|
|
#define NUM_VBLANKS_TO_MEASURE 1
|
|
#define NUM_MEASUREMENTS_TO_TAKE 8
|
|
|
|
|
|
/******************************Public*Routine******************************\
|
|
*
|
|
* DWORD dwGetPaletteEntry
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD dwGetPaletteEntry(
|
|
PDEV* ppdev,
|
|
DWORD iIndex)
|
|
{
|
|
BYTE* pjPorts;
|
|
DWORD dwRed;
|
|
DWORD dwGreen;
|
|
DWORD dwBlue;
|
|
|
|
pjPorts = ppdev->pjPorts;
|
|
|
|
CP_OUT_BYTE(pjPorts, DAC_PEL_READ_ADDR, iIndex);
|
|
|
|
dwRed = CP_IN_BYTE(pjPorts, DAC_PEL_DATA);
|
|
dwGreen = CP_IN_BYTE(pjPorts, DAC_PEL_DATA);
|
|
dwBlue = CP_IN_BYTE(pjPorts, DAC_PEL_DATA);
|
|
|
|
return((dwRed << 16) | (dwGreen << 8) | (dwBlue));
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* VOID vGetDisplayDuration
|
|
*
|
|
* Get the length, in EngQueryPerformanceCounter() ticks, of a refresh cycle.
|
|
*
|
|
* If we could trust the miniport to return back and accurate value for
|
|
* the refresh rate, we could use that. Unfortunately, our miniport doesn't
|
|
* ensure that it's an accurate value.
|
|
*
|
|
\**************************************************************************/
|
|
|
|
VOID vGetDisplayDuration(
|
|
PDEV* ppdev)
|
|
{
|
|
BYTE* pjPorts;
|
|
DWORD dwTemp;
|
|
LONG i, j;
|
|
LONGLONG li;
|
|
LONGLONG liMin;
|
|
LONGLONG aliMeasurement[NUM_MEASUREMENTS_TO_TAKE + 1];
|
|
|
|
pjPorts = ppdev->pjPorts;
|
|
|
|
memset(&ppdev->flipRecord, 0, sizeof(ppdev->flipRecord));
|
|
|
|
// Warm up EngQUeryPerformanceCounter to make sure it's in the working set.
|
|
EngQueryPerformanceCounter(&li);
|
|
|
|
// Unfortunately, since NT is a proper multitasking system, we can't just
|
|
// disable interrupts to take an accurate reading. We also can't do anything
|
|
// so goofy as dynamically change our thread's priority to real-time.
|
|
//
|
|
// So we just do a bunch of short measurements and take the minimum.
|
|
//
|
|
// It would be 'okay' if we got a result that's longer than the actual
|
|
// VBlank cycle time -- nothing bad would happen except that the app would
|
|
// run a little slower. We don't want to get a result that's shorter than
|
|
// the actual VBlank cycle time -- that could cause us to start drawing over
|
|
// a frame before the Flip has occured.
|
|
|
|
while (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)
|
|
;
|
|
while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE))
|
|
;
|
|
|
|
for (i = 0; i < NUM_MEASUREMENTS_TO_TAKE; i++)
|
|
{
|
|
// We're at the start of the VBlank active cycle!
|
|
EngQueryPerformanceCounter(&aliMeasurement[i]);
|
|
|
|
// Okay, so life in a multi-tasking environment isn't all that simple.
|
|
// What if we had taken a context switch just before the above
|
|
// EngQueryPerformanceCounter call, and now were half way through the
|
|
// VBlank inactive cycle? Then we would measure only half a VBlank
|
|
// cycle, which is obviously bad. The worst thing we can do is get a
|
|
// time shorter than the actual VBlank cycle time.
|
|
//
|
|
// So we solve this by making sure we're in the VBlank active time
|
|
// before and after we query the time. If it's not, we'll sync up to the
|
|
// next VBlank (it's okay to measure this period -- it will be
|
|
// guaranteed to be longer than the VBlank cycle and will likely be
|
|
// thrown out when we select the minimum sample). There's a chance that
|
|
// we'll take a context switch and return just before the end of the
|
|
// active VBlank time -- meaning that the actual measured time would be
|
|
// less than the true amount -- but since the VBlank is active less than
|
|
// 1% of the time, this means that we would have a maximum of 1% error
|
|
// approximately 1% of the times we take a context switch. An acceptable
|
|
// risk.
|
|
//
|
|
// This next line will cause us wait if we're no longer in the VBlank
|
|
// active cycle as we should be at this point.
|
|
while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE))
|
|
;
|
|
|
|
for (j = 0; j < NUM_VBLANKS_TO_MEASURE; j++)
|
|
{
|
|
while (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)
|
|
;
|
|
while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE))
|
|
;
|
|
}
|
|
}
|
|
|
|
EngQueryPerformanceCounter(&aliMeasurement[NUM_MEASUREMENTS_TO_TAKE]);
|
|
|
|
// Use the minimum.
|
|
liMin = aliMeasurement[1] - aliMeasurement[0];
|
|
|
|
DISPDBG((2, "Refresh count: %li - %li", 1, (ULONG) liMin));
|
|
|
|
for (i = 2; i <= NUM_MEASUREMENTS_TO_TAKE; i++)
|
|
{
|
|
li = aliMeasurement[i] - aliMeasurement[i - 1];
|
|
|
|
DISPDBG((2, " %li - %li", i, (ULONG) li));
|
|
|
|
if (li < liMin)
|
|
{
|
|
liMin = li;
|
|
}
|
|
}
|
|
|
|
// Round the result:
|
|
|
|
ppdev->flipRecord.liFlipDuration =
|
|
(DWORD) (liMin + (NUM_VBLANKS_TO_MEASURE / 2)) / NUM_VBLANKS_TO_MEASURE;
|
|
|
|
DISPDBG((2, "Frequency %li.%03li Hz",
|
|
(ULONG) (EngQueryPerformanceFrequency(&li),
|
|
li / ppdev->flipRecord.liFlipDuration),
|
|
(ULONG) (EngQueryPerformanceFrequency(&li),
|
|
((li * 1000) / ppdev->flipRecord.liFlipDuration) % 1000)));
|
|
|
|
ppdev->flipRecord.liFlipTime = aliMeasurement[NUM_MEASUREMENTS_TO_TAKE];
|
|
ppdev->flipRecord.bFlipFlag = FALSE;
|
|
ppdev->flipRecord.fpFlipFrom = 0;
|
|
|
|
// sge
|
|
// Get the line on which the VSYNC occurs
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x7);
|
|
dwTemp = (DWORD)CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
ppdev->dwVsyncLine = ((dwTemp & 0x80) << 2);
|
|
ppdev->dwVsyncLine |= ((dwTemp & 0x04) << 6);
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x10);
|
|
ppdev->dwVsyncLine |= CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* HRESULT dwUpdateFlipStatus
|
|
*
|
|
* Checks and sees if the most recent flip has occurred.
|
|
*
|
|
\**************************************************************************/
|
|
|
|
HRESULT UpdateFlipStatus(PDEV* ppdev, FLATPTR fpVidMem)
|
|
{
|
|
BYTE* pjPorts;
|
|
LONGLONG liTime;
|
|
|
|
pjPorts = ppdev->pjPorts;
|
|
|
|
if ((ppdev->flipRecord.bFlipFlag) &&
|
|
//#jc01 ((fpVidMem == 0) || (fpVidMem == ppdev->flipRecord.fpFlipFrom)))
|
|
((fpVidMem == 0xffffffff) || (fpVidMem == ppdev->flipRecord.fpFlipFrom))) //#jc01
|
|
{
|
|
#if 0 // sge use scanline
|
|
if (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)
|
|
{
|
|
if (ppdev->flipRecord.bWasEverInDisplay)
|
|
{
|
|
ppdev->flipRecord.bHaveEverCrossedVBlank = TRUE;
|
|
}
|
|
}
|
|
else if (!(CP_IN_BYTE(pjPorts, STATUS_1) & DISPLAY_MODE_INACTIVE))
|
|
{
|
|
if( ppdev->flipRecord.bHaveEverCrossedVBlank )
|
|
{
|
|
ppdev->flipRecord.bFlipFlag = FALSE;
|
|
return(DD_OK);
|
|
}
|
|
ppdev->flipRecord.bWasEverInDisplay = TRUE;
|
|
}
|
|
|
|
EngQueryPerformanceCounter(&liTime);
|
|
|
|
if (liTime - ppdev->flipRecord.liFlipTime
|
|
<= ppdev->flipRecord.liFlipDuration)
|
|
{
|
|
return(DDERR_WASSTILLDRAWING);
|
|
}
|
|
#else
|
|
/*
|
|
* if we aren't in the vertical retrace, we can use the scanline
|
|
* to help decide on what to do
|
|
*/
|
|
if( !(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE) )
|
|
{
|
|
if( ppdev->flipRecord.bHaveEverCrossedVBlank == FALSE )
|
|
{
|
|
ppdev->flipRecord.bWasEverInDisplay = TRUE;
|
|
if( GetCurrentVLine(ppdev) >= ppdev->flipRecord.dwFlipScanLine )
|
|
{
|
|
EngQueryPerformanceCounter(&liTime);
|
|
|
|
if (liTime - ppdev->flipRecord.liFlipTime
|
|
<= ppdev->flipRecord.liFlipDuration)
|
|
{
|
|
return(DDERR_WASSTILLDRAWING);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
/*
|
|
* in the vertical retrace, scanline is useless
|
|
*/
|
|
else
|
|
{
|
|
if( ppdev->flipRecord.bWasEverInDisplay )
|
|
{
|
|
ppdev->flipRecord.bHaveEverCrossedVBlank = TRUE;
|
|
// return DD_OK;
|
|
}
|
|
EngQueryPerformanceCounter(&liTime);
|
|
if (liTime - ppdev->flipRecord.liFlipTime
|
|
<= ppdev->flipRecord.liFlipDuration)
|
|
{
|
|
return(DDERR_WASSTILLDRAWING);
|
|
}
|
|
}
|
|
#endif // endif use scanline
|
|
ppdev->flipRecord.bFlipFlag = FALSE;
|
|
}
|
|
|
|
return(DD_OK);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdBlt
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdBlt(
|
|
PDD_BLTDATA lpBlt)
|
|
{
|
|
PDD_SURFACE_GLOBAL srcSurf;
|
|
PDD_SURFACE_GLOBAL dstSurf;
|
|
PDEV* ppdev;
|
|
BYTE* pjBase;
|
|
DWORD dstOffset;
|
|
DWORD dstPitch;
|
|
DWORD dstX, dstY;
|
|
DWORD dwFlags;
|
|
DWORD width, height;
|
|
DWORD srcOffset;
|
|
DWORD srcPitch;
|
|
DWORD srcX, srcY;
|
|
ULONG ulBltCmd;
|
|
DWORD xExt, yExt;
|
|
DWORD xDiff, yDiff;
|
|
|
|
ppdev = lpBlt->lpDD->dhpdev;
|
|
pjBase = ppdev->pjBase;
|
|
dstSurf = lpBlt->lpDDDestSurface->lpGbl;
|
|
|
|
// Is a flip in progress?
|
|
if (UpdateFlipStatus(ppdev, dstSurf->fpVidMem) != DD_OK)
|
|
{
|
|
lpBlt->ddRVal = DDERR_WASSTILLDRAWING;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
dwFlags = lpBlt->dwFlags;
|
|
|
|
if (dwFlags & DDBLT_ASYNC)
|
|
{
|
|
// If async, then only work if we won't have to wait on the accelerator
|
|
// to start the command.
|
|
if (!BLT_READY(ppdev, pjBase))
|
|
{
|
|
lpBlt->ddRVal = DDERR_WASSTILLDRAWING;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
}
|
|
|
|
DISPDBG((2, "DdBlt Entered"));
|
|
|
|
// Calculate destination parameters.
|
|
dstX = lpBlt->rDest.left;
|
|
dstY = lpBlt->rDest.top;
|
|
width = PELS_TO_BYTES(lpBlt->rDest.right - dstX) - 1;
|
|
height = (lpBlt->rDest.bottom - dstY) - 1;
|
|
dstPitch = dstSurf->lPitch;
|
|
dstOffset = (DWORD)(dstSurf->fpVidMem + PELS_TO_BYTES(dstX)
|
|
+ (dstY * dstPitch));
|
|
|
|
// Color fill?
|
|
if (dwFlags & DDBLT_COLORFILL)
|
|
{
|
|
ULONG ulBltMode = ENABLE_COLOR_EXPAND
|
|
| ENABLE_8x8_PATTERN_COPY
|
|
| ppdev->jModeColor;
|
|
|
|
// Wait for the accelerator.
|
|
while (!BLT_READY(ppdev, pjBase))
|
|
;
|
|
|
|
// Program bitblt engine.
|
|
CP_MM_ROP(ppdev, pjBase, HW_P);
|
|
CP_MM_DST_Y_OFFSET(ppdev, pjBase, dstPitch);
|
|
CP_MM_BLT_MODE(ppdev, pjBase, ulBltMode);
|
|
CP_MM_FG_COLOR(ppdev, pjBase, lpBlt->bltFX.dwFillColor);
|
|
if (ppdev->flCaps & CAPS_AUTOSTART)
|
|
{
|
|
CP_MM_BLT_EXT_MODE(ppdev, pjBase, ENABLE_SOLID_FILL);
|
|
}
|
|
else
|
|
{
|
|
CP_MM_SRC_ADDR(ppdev, pjBase, ppdev->ulSolidColorOffset);
|
|
}
|
|
CP_MM_XCNT(ppdev, pjBase, width);
|
|
CP_MM_YCNT(ppdev, pjBase, height);
|
|
CP_MM_DST_ADDR_ABS(ppdev, pjBase, dstOffset);
|
|
CP_MM_START_BLT(ppdev, pjBase);
|
|
|
|
lpBlt->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
|
|
// We specified with Our ddCaps.dwCaps that we handle a limited number of
|
|
// commands, and by this point in our routine we've handled everything
|
|
// except DDBLT_ROP. DirectDraw and GDI shouldn't pass us anything else;
|
|
// we'll assert on debug builds to prove this.
|
|
ASSERTDD((dwFlags & DDBLT_ROP) && (lpBlt->lpDDSrcSurface),
|
|
"Expected dwFlags commands of only DDBLT_ASYNC and DDBLT_COLORFILL");
|
|
|
|
// Get offset, width, and height for source.
|
|
srcSurf = lpBlt->lpDDSrcSurface->lpGbl;
|
|
srcX = lpBlt->rSrc.left;
|
|
srcY = lpBlt->rSrc.top;
|
|
srcPitch = srcSurf->lPitch;
|
|
srcOffset = (DWORD)(srcSurf->fpVidMem + PELS_TO_BYTES(srcX)
|
|
+ (srcY * srcPitch));
|
|
|
|
/*
|
|
* Account for PackJR. If the start and the width are not 4 pixel
|
|
* aligned, we need to BLT this by hand. Otherwsie, if they think
|
|
* they are BLTing 16 bit data, we must adjust the parameters now.
|
|
*
|
|
* This is also a good place to check that YUV BLTs are 2 pixel
|
|
* aligned.
|
|
*/
|
|
if (lpBlt->lpDDDestSurface->dwReserved1 & (OVERLAY_FLG_PACKJR | OVERLAY_FLG_YUV422))
|
|
{
|
|
|
|
ASSERTDD(0, "Who will get here?");
|
|
#if 0 // software blt
|
|
/*
|
|
* Check YUV first. We can fail this if incorrect because the client
|
|
* should know better (since they are explicitly use YUV).
|
|
*/
|
|
if ((lpBlt->lpDDDestSurface->dwReserved1 & OVERLAY_FLG_YUV422) &&
|
|
((lpBlt->rSrc.left & 0x01) != (lpBlt->rDest.left & 0x01)))
|
|
{
|
|
lpBlt->ddRVal = DDERR_XALIGN;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/*
|
|
* If PackJR is wrong, we must make this work ourselves because we
|
|
* may be converting to this w/o the client knowing.
|
|
*/
|
|
else if (lpBlt->lpDDDestSurface->dwReserved1 & OVERLAY_FLG_PACKJR)
|
|
{
|
|
if (dwFlags & DDBLT_COLORFILL)
|
|
{
|
|
lpBlt->ddRVal = DDERR_XALIGN;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
if ((lpBlt->rSrc.left & 0x03) || (lpBlt->rDest.left & 0x03))
|
|
{
|
|
/*
|
|
* The start doesn't align - we have to do this the slow way
|
|
*/
|
|
PackJRBltAlign ((LPBYTE) ppdev->pjScreen + srcOffset,
|
|
(LPBYTE) ppdev->pjScreen + dstOffset,
|
|
lpBlt->rDest.right - lpBlt->rDest.left,
|
|
lpBlt->rDest.bottom - lpBlt->rDest.top,
|
|
srcPitch, dstPitch);
|
|
|
|
lpBlt->ddRVal = DD_OK;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
else if (lpBlt->rSrc.right & 0x03)
|
|
{
|
|
/*
|
|
* The end doesn't align - we will do the BLT as normal, but
|
|
* write the last pixels the slow way
|
|
*/
|
|
if (lpBlt->lpDDDestSurface->dwReserved1 & (OVERLAY_FLG_CONVERT_PACKJR | OVERLAY_FLG_MUST_RASTER))
|
|
{
|
|
srcPitch >>= 1;
|
|
srcOffset = srcSurf->fpVidMem + PELS_TO_BYTES(srcX) + (srcY * srcPitch);
|
|
dstPitch >>= 1;
|
|
dstOffset = dstSurf->fpVidMem + PELS_TO_BYTES(dstX) + (dstY * dstPitch);
|
|
}
|
|
width = ((WORD)lpBlt->rSrc.right & ~0x03) - (WORD)lpBlt->rSrc.left;
|
|
PackJRBltAlignEnd ((LPBYTE) ppdev->pjScreen + srcOffset + width,
|
|
(LPBYTE) ppdev->pjScreen + dstOffset + width,
|
|
lpBlt->rSrc.right & 0x03,
|
|
lpBlt->rDest.bottom - lpBlt->rDest.top, srcPitch, dstPitch);
|
|
}
|
|
else if (lpBlt->lpDDDestSurface->dwReserved1 & (OVERLAY_FLG_CONVERT_PACKJR | OVERLAY_FLG_MUST_RASTER))
|
|
{
|
|
/*
|
|
* Everything aligns, but we have to re-calculate the start
|
|
* address and the pitch.
|
|
*/
|
|
srcPitch >>= 1;
|
|
srcOffset = srcSurf->fpVidMem + PELS_TO_BYTES(srcX) + (srcY * srcPitch);
|
|
dstPitch >>= 1;
|
|
dstOffset = dstSurf->fpVidMem + PELS_TO_BYTES(dstX) + (dstY * dstPitch);
|
|
width >>= 1;
|
|
}
|
|
}
|
|
#endif
|
|
}
|
|
|
|
if ((dstSurf == srcSurf) && (srcOffset < dstOffset))
|
|
{
|
|
// Okay, we have to do the blt bottom-to-top, right-to-left.
|
|
ulBltCmd = DIR_BTRL;
|
|
;
|
|
srcOffset += width + (srcPitch * height);
|
|
dstOffset += width + (dstPitch * height);
|
|
}
|
|
else
|
|
{
|
|
// Okay, we have to do the blt top-to-bottom, left-to-right.
|
|
ulBltCmd = DIR_TBLR;
|
|
}
|
|
|
|
// Wait for the accelerator.
|
|
while (!BLT_READY(ppdev, pjBase))
|
|
;
|
|
|
|
//
|
|
// What about source color key
|
|
//
|
|
ASSERTDD((!(dwFlags & DDBLT_KEYSRC)), "Do not expected source color key");
|
|
|
|
if (dwFlags & DDBLT_KEYSRCOVERRIDE)
|
|
{
|
|
ULONG ulColor;
|
|
|
|
//
|
|
// sge02
|
|
//
|
|
ulBltCmd |= ENABLE_TRANSPARENCY_COMPARE | ppdev->jModeColor;
|
|
ulColor = lpBlt->bltFX.ddckSrcColorkey.dwColorSpaceLowValue;
|
|
if (ppdev->cBpp == 1)
|
|
{
|
|
ulColor |= ulColor << 8;
|
|
}
|
|
CP_WRITE_USHORT(pjBase, MM_BLT_COLOR_KEY, ulColor);
|
|
}
|
|
|
|
if ( (ulBltCmd & DIR_BTRL)
|
|
&& (ulBltCmd & ENABLE_TRANSPARENCY_COMPARE)
|
|
&& (ppdev->cBpp > 1)
|
|
)
|
|
{
|
|
ulBltCmd &= ~DIR_BTRL;
|
|
xExt = lpBlt->rDest.right - lpBlt->rDest.left;
|
|
yExt = lpBlt->rDest.bottom - lpBlt->rDest.top;
|
|
xDiff = dstX - srcX;
|
|
yDiff = dstY - srcY;
|
|
|
|
if (yDiff == 0)
|
|
{
|
|
srcOffset -= srcPitch * height - 1;
|
|
dstOffset -= dstPitch * height - 1;
|
|
|
|
while (xExt)
|
|
{
|
|
width = PELS_TO_BYTES(min(xDiff, xExt));
|
|
srcOffset -= width;
|
|
dstOffset -= width;
|
|
|
|
while (!BLT_READY(ppdev, pjBase)) ;
|
|
|
|
CP_MM_ROP(ppdev, pjBase, CL_SRC_COPY);
|
|
CP_MM_BLT_MODE(ppdev, pjBase, ulBltCmd);
|
|
CP_MM_BLT_EXT_MODE(ppdev, pjBase, 0);
|
|
CP_MM_SRC_Y_OFFSET(ppdev, pjBase, srcPitch);
|
|
CP_MM_DST_Y_OFFSET(ppdev, pjBase, dstPitch);
|
|
CP_MM_XCNT(ppdev, pjBase, width - 1);
|
|
CP_MM_YCNT(ppdev, pjBase, height);
|
|
CP_MM_SRC_ADDR(ppdev, pjBase, srcOffset);
|
|
CP_MM_DST_ADDR_ABS(ppdev, pjBase, dstOffset);
|
|
CP_MM_START_BLT(ppdev, pjBase);
|
|
|
|
xExt -= min(xDiff, xExt);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
srcOffset -= width - srcPitch;
|
|
dstOffset -= width - dstPitch;
|
|
|
|
while (yExt)
|
|
{
|
|
height = min(yDiff, yExt);
|
|
srcOffset -= height * srcPitch;
|
|
dstOffset -= height * dstPitch;
|
|
|
|
while (!BLT_READY(ppdev, pjBase)) ;
|
|
|
|
CP_MM_ROP(ppdev, pjBase, CL_SRC_COPY);
|
|
CP_MM_BLT_MODE(ppdev, pjBase, ulBltCmd);
|
|
CP_MM_BLT_EXT_MODE(ppdev, pjBase, 0);
|
|
CP_MM_SRC_Y_OFFSET(ppdev, pjBase, srcPitch);
|
|
CP_MM_DST_Y_OFFSET(ppdev, pjBase, dstPitch);
|
|
CP_MM_XCNT(ppdev, pjBase, width);
|
|
CP_MM_YCNT(ppdev, pjBase, height - 1);
|
|
CP_MM_SRC_ADDR(ppdev, pjBase, srcOffset);
|
|
CP_MM_DST_ADDR_ABS(ppdev, pjBase, dstOffset);
|
|
CP_MM_START_BLT(ppdev, pjBase);
|
|
|
|
yExt -= min(yDiff, yExt);
|
|
}
|
|
}
|
|
}
|
|
|
|
else
|
|
{
|
|
CP_MM_ROP(ppdev, pjBase, CL_SRC_COPY);
|
|
CP_MM_BLT_MODE(ppdev, pjBase, ulBltCmd);
|
|
CP_MM_BLT_EXT_MODE(ppdev, pjBase, 0); // jl01
|
|
CP_MM_SRC_Y_OFFSET(ppdev, pjBase, srcPitch);
|
|
CP_MM_DST_Y_OFFSET(ppdev, pjBase, dstPitch);
|
|
CP_MM_XCNT(ppdev, pjBase, width);
|
|
CP_MM_YCNT(ppdev, pjBase, height);
|
|
CP_MM_SRC_ADDR(ppdev, pjBase, srcOffset);
|
|
CP_MM_DST_ADDR_ABS(ppdev, pjBase, dstOffset);
|
|
CP_MM_START_BLT(ppdev, pjBase);
|
|
}
|
|
|
|
lpBlt->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdFlip
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdFlip(
|
|
PDD_FLIPDATA lpFlip)
|
|
{
|
|
PDEV* ppdev;
|
|
BYTE* pjPorts;
|
|
ULONG ulMemoryOffset;
|
|
ULONG ulLowOffset;
|
|
ULONG ulMiddleOffset;
|
|
ULONG ulHighOffset1, ulHighOffset2;
|
|
|
|
ppdev = lpFlip->lpDD->dhpdev;
|
|
pjPorts = ppdev->pjPorts;
|
|
|
|
DISPDBG((2, "DdFlip: %d x %d at %08x(%d, %d) Pitch=%d",
|
|
lpFlip->lpSurfTarg->lpGbl->wWidth,
|
|
lpFlip->lpSurfTarg->lpGbl->wHeight,
|
|
lpFlip->lpSurfTarg->lpGbl->fpVidMem,
|
|
lpFlip->lpSurfTarg->lpGbl->xHint,
|
|
lpFlip->lpSurfTarg->lpGbl->yHint,
|
|
lpFlip->lpSurfTarg->lpGbl->lPitch));
|
|
|
|
// Is the current flip still in progress?
|
|
//
|
|
// Don't want a flip to work until after the last flip is done, so we ask
|
|
// for the general flip status and ignore the vmem.
|
|
//#jc01 if ((UpdateFlipStatus(ppdev, 0) != DD_OK) ||
|
|
if ((UpdateFlipStatus(ppdev, 0xffffffff) != DD_OK) || /* #jc01 */
|
|
(BLT_BUSY(ppdev, ppdev->pjBase)))
|
|
{
|
|
lpFlip->ddRVal = DDERR_WASSTILLDRAWING;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
ulMemoryOffset = (ULONG)(lpFlip->lpSurfTarg->lpGbl->fpVidMem);
|
|
// Make sure that the border/blanking period isn't active; wait if it is. We
|
|
// could return DDERR_WASSTILLDRAWING in this case, but that will increase
|
|
// the odds that we can't flip the next time.
|
|
while (CP_IN_BYTE(pjPorts, STATUS_1) & DISPLAY_MODE_INACTIVE)
|
|
;
|
|
DISPDBG((2, "DdFlip Entered"));
|
|
#if 1 // OVERLAY #sge
|
|
if (lpFlip->lpSurfCurr->ddsCaps.dwCaps & DDSCAPS_OVERLAY)
|
|
{
|
|
DWORD dwOffset;
|
|
BYTE bRegCR3A;
|
|
BYTE bRegCR3B;
|
|
BYTE bRegCR3C;
|
|
// Make sure that the overlay surface we're flipping from is
|
|
// currently visible. If you don't do this check, you'll get
|
|
// really weird results when someone starts up two ActiveMovie
|
|
// or DirectVideo movies simultaneously!
|
|
|
|
if (lpFlip->lpSurfCurr->lpGbl->fpVidMem == ppdev->fpVisibleOverlay)
|
|
{
|
|
ppdev->fpVisibleOverlay = ulMemoryOffset;
|
|
/*
|
|
* Determine the offset to the new area.
|
|
*/
|
|
// dwOffset = ((ulMemoryOffset - (ULONG)ppdev->pjScreen) + ppdev->sOverlay1.lAdjustSource) >> 2; // sss
|
|
dwOffset = ((ulMemoryOffset + ppdev->sOverlay1.lAdjustSource) >> 2);
|
|
|
|
/*
|
|
* Flip the overlay surface by changing CR3A, CR3B, and CR3C
|
|
*/
|
|
bRegCR3A = (BYTE) dwOffset & 0xfe; // Align on word boundary (5446 bug)
|
|
dwOffset >>= 8;
|
|
bRegCR3B = (BYTE) dwOffset;
|
|
dwOffset >>= 8;
|
|
bRegCR3C = (BYTE) (dwOffset & 0x0f);
|
|
// if(GetOverlayFlipStatus(0) != DD_OK || DRAW_ENGINE_BUSY || IN_VBLANK)
|
|
// {
|
|
// lpFlipData->ddRVal = DDERR_WASSTILLDRAWING;
|
|
// return DDHAL_DRIVER_HANDLED;
|
|
// }
|
|
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x3C);
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, (CP_IN_BYTE(pjPorts, CRTC_DATA) & 0xf0) | bRegCR3C);
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD)bRegCR3A << 8) | 0x3A);
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD)bRegCR3B << 8) | 0x3B);
|
|
}
|
|
else
|
|
{
|
|
lpFlip->ddRVal = DDERR_OUTOFCAPS;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
}
|
|
else
|
|
#endif // OVERLAY
|
|
{
|
|
// Do the flip.
|
|
ulMemoryOffset >>= 2;
|
|
|
|
ulLowOffset = 0x0D | ((ulMemoryOffset & 0x0000FF) << 8);
|
|
ulMiddleOffset = 0x0C | ((ulMemoryOffset & 0x00FF00));
|
|
ulHighOffset1 = 0x1B | ((ulMemoryOffset & 0x010000) >> 8)
|
|
| ((ulMemoryOffset & 0x060000) >> 7)
|
|
| ppdev->ulCR1B;
|
|
ulHighOffset2 = 0x1D | ((ulMemoryOffset & 0x080000) >> 4)
|
|
| ppdev->ulCR1D;
|
|
|
|
// Too bad that the Cirrus flip can't be done in a single atomic register
|
|
// write; as it is, we stand a small chance of being context-switched out
|
|
// and exactly hitting the vertical blank in the middle of doing these outs,
|
|
// possibly causing the screen to momentarily jump.
|
|
//
|
|
// There are some hoops we could jump through to minimize the chances of
|
|
// this happening; we could try to align the flip buffer such that the minor
|
|
// registers are ensured to be identical for either flip position, ans so
|
|
// that only the high address need be written, an obviously atomic
|
|
// operation.
|
|
//
|
|
// However, I'm simply not going to worry about it.
|
|
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ulHighOffset2);
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ulHighOffset1);
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ulMiddleOffset);
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ulLowOffset);
|
|
}
|
|
// Remember where and when we were when we did the flip.
|
|
EngQueryPerformanceCounter(&ppdev->flipRecord.liFlipTime);
|
|
|
|
ppdev->flipRecord.bFlipFlag = TRUE;
|
|
ppdev->flipRecord.bHaveEverCrossedVBlank = FALSE;
|
|
|
|
ppdev->flipRecord.fpFlipFrom = lpFlip->lpSurfCurr->lpGbl->fpVidMem;
|
|
|
|
if((CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE))
|
|
{
|
|
ppdev->flipRecord.dwFlipScanLine = 0;
|
|
ppdev->flipRecord.bWasEverInDisplay = FALSE;
|
|
}
|
|
else
|
|
{
|
|
ppdev->flipRecord.dwFlipScanLine = GetCurrentVLine(ppdev);
|
|
ppdev->flipRecord.bWasEverInDisplay = TRUE;
|
|
}
|
|
|
|
lpFlip->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdLock
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdLock(PDD_LOCKDATA lpLock)
|
|
{
|
|
PDEV* ppdev = lpLock->lpDD->dhpdev;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
// Check to see if any pending physical flip has occurred. Don't allow a
|
|
// lock if a blt is in progress.
|
|
if (UpdateFlipStatus(ppdev, lpLock->lpDDSurface->lpGbl->fpVidMem)
|
|
!= DD_OK)
|
|
{
|
|
lpLock->ddRVal = DDERR_WASSTILLDRAWING;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
if (lpLock->dwFlags & DDLOCK_WAIT)
|
|
{
|
|
CP_MM_WAIT_FOR_BLT_COMPLETE(ppdev, ppdev->pjBase);
|
|
}
|
|
if (BLT_BUSY(ppdev, ppdev->pjBase))
|
|
{
|
|
lpLock->ddRVal = DDERR_WASSTILLDRAWING;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/*
|
|
* Force them to use the video apperture
|
|
*/
|
|
if ((lpLock->lpDDSurface->dwReserved1 & OVERLAY_FLG_OVERLAY) &&
|
|
(lpLock->dwFlags == DDLOCK_SURFACEMEMORYPTR) &&
|
|
(ppdev->fpBaseOverlay != 0xffffffff))
|
|
{
|
|
|
|
if (lpLock->lpDDSurface->dwReserved1 & OVERLAY_FLG_DECIMATE)
|
|
{
|
|
/*
|
|
* Turn on decimation
|
|
*/
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x3f);
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, CP_IN_BYTE(pjPorts, CRTC_DATA) | 0x10);
|
|
|
|
}
|
|
if( lpLock->lpDDSurface->lpGbl->ddpfSurface.dwFourCC == FOURCC_YUY2)
|
|
lpLock->lpSurfData = (LPVOID)(ppdev->fpBaseOverlay + lpLock->lpDDSurface->lpGbl->fpVidMem + 0x400000);
|
|
else
|
|
lpLock->lpSurfData = (LPVOID)(ppdev->fpBaseOverlay + lpLock->lpDDSurface->lpGbl->fpVidMem + 0x400000 * 3);
|
|
|
|
// When a driver returns DD_OK and DDHAL_DRIVER_HANDLED from DdLock,
|
|
// DirectDraw expects it to have adjusted the resulting pointer
|
|
// to point to the upper left corner of the specified rectangle, if
|
|
// any:
|
|
|
|
if (lpLock->bHasRect)
|
|
{
|
|
lpLock->lpSurfData = (VOID*) ((BYTE*) lpLock->lpSurfData
|
|
+ lpLock->rArea.top * lpLock->lpDDSurface->lpGbl->lPitch
|
|
+ lpLock->rArea.left
|
|
* (lpLock->lpDDSurface->lpGbl->ddpfSurface.dwYUVBitCount >> 3));
|
|
}
|
|
|
|
lpLock->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
return(DDHAL_DRIVER_NOTHANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdUnlock
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdUnlock(PDD_UNLOCKDATA lpUnlock)
|
|
{
|
|
PDEV* ppdev = lpUnlock->lpDD->dhpdev;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
if ((lpUnlock->lpDDSurface->dwReserved1 & OVERLAY_FLG_YUVPLANAR) &&
|
|
!(lpUnlock->lpDDSurface->dwReserved1 & OVERLAY_FLG_ENABLED))
|
|
{
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, (0x00 << 8) | 0x3f); // Turn off YUV Planar
|
|
}
|
|
|
|
else if (lpUnlock->lpDDSurface->dwReserved1 & OVERLAY_FLG_DECIMATE)
|
|
{
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, (0x00 << 8) | 0x3f); // Turn off YUV Planar
|
|
}
|
|
|
|
return(DDHAL_DRIVER_NOTHANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdGetBltStatus
|
|
*
|
|
* Doesn't currently really care what surface is specified, just checks
|
|
* and goes.
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdGetBltStatus(PDD_GETBLTSTATUSDATA lpGetBltStatus)
|
|
{
|
|
PDEV* ppdev;
|
|
HRESULT ddRVal;
|
|
PBYTE pjBase;
|
|
|
|
ppdev = lpGetBltStatus->lpDD->dhpdev;
|
|
pjBase = ppdev->pjBase;
|
|
|
|
ddRVal = DD_OK;
|
|
if (lpGetBltStatus->dwFlags == DDGBS_CANBLT)
|
|
{
|
|
// DDGBS_CANBLT case: can we add a blt?
|
|
ddRVal = UpdateFlipStatus(ppdev, lpGetBltStatus->lpDDSurface->lpGbl->fpVidMem);
|
|
|
|
if (ddRVal == DD_OK)
|
|
{
|
|
// There was no flip going on, so can the blitter accept new
|
|
// register writes?
|
|
if (!BLT_READY(ppdev, pjBase))
|
|
{
|
|
ddRVal = DDERR_WASSTILLDRAWING;
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// DDGBS_ISBLTDONE case: is a blt in progress?
|
|
if (BLT_BUSY(ppdev, pjBase))
|
|
{
|
|
ddRVal = DDERR_WASSTILLDRAWING;
|
|
}
|
|
}
|
|
|
|
lpGetBltStatus->ddRVal = ddRVal;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdMapMemory
|
|
*
|
|
* This is a new DDI call specific to Windows NT that is used to map
|
|
* or unmap all the application modifiable portions of the frame buffer
|
|
* into the specified process's address space.
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdMapMemory(PDD_MAPMEMORYDATA lpMapMemory)
|
|
{
|
|
PDEV* ppdev;
|
|
VIDEO_SHARE_MEMORY ShareMemory;
|
|
VIDEO_SHARE_MEMORY_INFORMATION ShareMemoryInformation;
|
|
DWORD ReturnedDataLength;
|
|
|
|
ppdev = lpMapMemory->lpDD->dhpdev;
|
|
|
|
if (lpMapMemory->bMap)
|
|
{
|
|
ShareMemory.ProcessHandle = lpMapMemory->hProcess;
|
|
|
|
// 'RequestedVirtualAddress' isn't actually used for the SHARE IOCTL.
|
|
ShareMemory.RequestedVirtualAddress = 0;
|
|
|
|
// We map in starting at the top of the frame buffer.
|
|
ShareMemory.ViewOffset = 0;
|
|
|
|
// We map down to the end of the frame buffer.
|
|
//
|
|
// Note: There is a 64k granularity on the mapping (meaning that we
|
|
// have to round up to 64k).
|
|
//
|
|
// Note: If there is any portion of the frame buffer that must not be
|
|
// modified by an application, that portion of memory MUST NOT be
|
|
// mapped in by this call. This would include any data that, if
|
|
// modified by a malicious application, would cause the driver to
|
|
// crash. This could include, for example, any DSP code that is
|
|
// kept in off-screen memory.
|
|
|
|
ShareMemory.ViewSize = ROUND_UP_TO_64K(ppdev->cyMemory * ppdev->lDelta + 0x400000 * 3);
|
|
|
|
if (EngDeviceIoControl(ppdev->hDriver,
|
|
IOCTL_VIDEO_SHARE_VIDEO_MEMORY,
|
|
&ShareMemory,
|
|
sizeof(VIDEO_SHARE_MEMORY),
|
|
&ShareMemoryInformation,
|
|
sizeof(VIDEO_SHARE_MEMORY_INFORMATION),
|
|
&ReturnedDataLength))
|
|
{
|
|
DISPDBG((0, "Failed IOCTL_VIDEO_SHARE_MEMORY"));
|
|
|
|
lpMapMemory->ddRVal = DDERR_GENERIC;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
lpMapMemory->fpProcess =(FLATPTR)ShareMemoryInformation.VirtualAddress;
|
|
ppdev->fpBaseOverlay = lpMapMemory->fpProcess;
|
|
}
|
|
else
|
|
{
|
|
ShareMemory.ProcessHandle = lpMapMemory->hProcess;
|
|
ShareMemory.ViewOffset = 0;
|
|
ShareMemory.ViewSize = 0;
|
|
ShareMemory.RequestedVirtualAddress = (VOID*) lpMapMemory->fpProcess;
|
|
//
|
|
// Active movie will unmap memory twice
|
|
//
|
|
//if (ppdev->fpBaseOverlay == lpMapMemory->fpProcess)
|
|
// ppdev->fpBaseOverlay = 0;
|
|
|
|
if (EngDeviceIoControl(ppdev->hDriver,
|
|
IOCTL_VIDEO_UNSHARE_VIDEO_MEMORY,
|
|
&ShareMemory,
|
|
sizeof(VIDEO_SHARE_MEMORY),
|
|
NULL,
|
|
0,
|
|
&ReturnedDataLength))
|
|
{
|
|
RIP("Failed IOCTL_VIDEO_UNSHARE_MEMORY");
|
|
}
|
|
}
|
|
|
|
lpMapMemory->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdGetFlipStatus
|
|
*
|
|
* If the display has gone through one refresh cycle since the flip
|
|
* occurred, we return DD_OK. If it has not gone through one refresh
|
|
* cycle we return DDERR_WASSTILLDRAWING to indicate that this surface
|
|
* is still busy "drawing" the flipped page. We also return
|
|
* DDERR_WASSTILLDRAWING if the bltter is busy and the caller wanted
|
|
* to know if they could flip yet.
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdGetFlipStatus(
|
|
PDD_GETFLIPSTATUSDATA lpGetFlipStatus)
|
|
{
|
|
HRESULT ddRVal;
|
|
PDEV* ppdev = lpGetFlipStatus->lpDD->dhpdev;
|
|
|
|
// We don't want a flip to work until after the last flip is done, so we ask
|
|
// for the general flip status and ignore the vmem.
|
|
|
|
//#jc01 ddRVal = UpdateFlipStatus(ppdev, 0);
|
|
ddRVal = UpdateFlipStatus(ppdev, 0xffffffff); //#jc01
|
|
|
|
// Check if the blitter is busy if someone wants to know if they can flip.
|
|
if ((lpGetFlipStatus->dwFlags == DDGFS_CANFLIP) && (ddRVal == DD_OK))
|
|
{
|
|
if (BLT_BUSY(ppdev, ppdev->pjBase))
|
|
{
|
|
ddRVal = DDERR_WASSTILLDRAWING;
|
|
}
|
|
}
|
|
|
|
lpGetFlipStatus->ddRVal = ddRVal;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdWaitForVerticalBlank
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdWaitForVerticalBlank(
|
|
PDD_WAITFORVERTICALBLANKDATA lpWaitForVerticalBlank)
|
|
{
|
|
PDEV* ppdev;
|
|
BYTE* pjPorts;
|
|
|
|
ppdev = lpWaitForVerticalBlank->lpDD->dhpdev;
|
|
pjPorts = ppdev->pjPorts;
|
|
|
|
lpWaitForVerticalBlank->ddRVal = DD_OK;
|
|
|
|
switch (lpWaitForVerticalBlank->dwFlags)
|
|
{
|
|
case DDWAITVB_I_TESTVB:
|
|
|
|
// If TESTVB, it's just a request for the current vertical blank status.
|
|
if (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)
|
|
lpWaitForVerticalBlank->bIsInVB = TRUE;
|
|
else
|
|
lpWaitForVerticalBlank->bIsInVB = FALSE;
|
|
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
|
|
case DDWAITVB_BLOCKBEGIN:
|
|
|
|
// If BLOCKBEGIN is requested, we wait until the vertical blank is over,
|
|
// and then wait for the display period to end.
|
|
while (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)
|
|
;
|
|
while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE))
|
|
;
|
|
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
|
|
case DDWAITVB_BLOCKEND:
|
|
|
|
// If BLOCKEND is requested, we wait for the vblank interval to end.
|
|
while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE))
|
|
;
|
|
while (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)
|
|
;
|
|
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
return(DDHAL_DRIVER_NOTHANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdGetScanLine
|
|
*
|
|
* Reads the scan line currently being scanned by the CRT.
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdGetScanLine(
|
|
PDD_GETSCANLINEDATA lpGetScanLine)
|
|
{
|
|
PDEV* ppdev;
|
|
BYTE* pjPorts;
|
|
|
|
ppdev = (PDEV*) lpGetScanLine->lpDD->dhpdev;
|
|
pjPorts = ppdev->pjPorts;
|
|
|
|
/*
|
|
* If a vertical blank is in progress the scan line is in
|
|
* indeterminant. If the scan line is indeterminant we return
|
|
* the error code DDERR_VERTICALBLANKINPROGRESS.
|
|
* Otherwise we return the scan line and a success code
|
|
*/
|
|
if( CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE )
|
|
{
|
|
lpGetScanLine->ddRVal = DDERR_VERTICALBLANKINPROGRESS;
|
|
}
|
|
else
|
|
{
|
|
lpGetScanLine->dwScanLine = GetCurrentVLine(ppdev);
|
|
lpGetScanLine->ddRVal = DD_OK;
|
|
}
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdCanCreateSurface
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdCanCreateSurface(
|
|
PDD_CANCREATESURFACEDATA lpCanCreateSurface)
|
|
{
|
|
PDEV* ppdev;
|
|
DWORD dwRet;
|
|
LPDDSURFACEDESC lpSurfaceDesc;
|
|
|
|
ppdev = (PDEV*) lpCanCreateSurface->lpDD->dhpdev;
|
|
lpSurfaceDesc = lpCanCreateSurface->lpDDSurfaceDesc;
|
|
|
|
dwRet = DDHAL_DRIVER_NOTHANDLED;
|
|
|
|
DISPDBG((2, "DdCanCreateSurface Entered"));
|
|
|
|
if (!lpCanCreateSurface->bIsDifferentPixelFormat)
|
|
{
|
|
// It's trivially easy to create plain surfaces that are the same
|
|
// type as the primary surface:
|
|
|
|
dwRet = DDHAL_DRIVER_HANDLED;
|
|
}
|
|
|
|
else if (ppdev->flStatus & STAT_STREAMS_ENABLED)
|
|
{
|
|
// When using the Streams processor, we handle only overlays of
|
|
// different pixel formats -- not any off-screen memory:
|
|
|
|
if (lpSurfaceDesc->ddsCaps.dwCaps & DDSCAPS_OVERLAY)
|
|
{
|
|
/*
|
|
* YUV Planar surfaces cannot co-exist with other overlay surfaces.
|
|
*/
|
|
if (ppdev->OvlyCnt >= 1)
|
|
{
|
|
lpCanCreateSurface->ddRVal = DDERR_OUTOFCAPS;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
if ((lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_YUVPLANAR) &&
|
|
ppdev->OvlyCnt)
|
|
{
|
|
lpCanCreateSurface->ddRVal = DDERR_INVALIDPIXELFORMAT;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
else if (ppdev->PlanarCnt)
|
|
{
|
|
lpCanCreateSurface->ddRVal = DDERR_INVALIDPIXELFORMAT;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
// We handle four types of YUV overlay surfaces:
|
|
|
|
if (lpSurfaceDesc->ddpfPixelFormat.dwFlags & DDPF_FOURCC)
|
|
{
|
|
// Check first for a supported YUV type:
|
|
|
|
if (lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_YUV422)
|
|
{
|
|
lpSurfaceDesc->ddpfPixelFormat.dwYUVBitCount = 16;
|
|
dwRet = DDHAL_DRIVER_HANDLED;
|
|
}
|
|
else if ((lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_YUY2) &&
|
|
((ppdev->ulChipID != 0x40) && (ppdev->ulChipID != 0x4C)) ) //tao1
|
|
{
|
|
lpSurfaceDesc->ddpfPixelFormat.dwYUVBitCount = 16;
|
|
dwRet = DDHAL_DRIVER_HANDLED;
|
|
}
|
|
else if (lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_PACKJR)
|
|
{
|
|
if( ppdev->cBitsPerPixel <= 16)
|
|
{
|
|
lpSurfaceDesc->ddpfPixelFormat.dwYUVBitCount = 8;
|
|
dwRet = DDHAL_DRIVER_HANDLED;
|
|
}
|
|
}
|
|
else if (lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_YUVPLANAR)
|
|
{
|
|
lpSurfaceDesc->ddpfPixelFormat.dwYUVBitCount = 8;
|
|
dwRet = DDHAL_DRIVER_HANDLED;
|
|
}
|
|
}
|
|
|
|
else if (lpSurfaceDesc->ddpfPixelFormat.dwFlags & DDPF_RGB)
|
|
{
|
|
if((lpSurfaceDesc->ddpfPixelFormat.dwFlags & DDPF_PALETTEINDEXED8) &&
|
|
ppdev->cBitsPerPixel == 16 )
|
|
{
|
|
dwRet = DDHAL_DRIVER_HANDLED;
|
|
}
|
|
else if (lpSurfaceDesc->ddpfPixelFormat.dwRGBBitCount == 16)
|
|
{
|
|
dwRet = DDHAL_DRIVER_HANDLED;
|
|
}
|
|
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
// Print some spew if this was a surface we refused to create:
|
|
|
|
if (dwRet == DDHAL_DRIVER_NOTHANDLED)
|
|
{
|
|
if (lpSurfaceDesc->ddpfPixelFormat.dwFlags & DDPF_RGB)
|
|
{
|
|
DISPDBG((0, "Failed creation of %libpp RGB surface %lx %lx %lx",
|
|
lpSurfaceDesc->ddpfPixelFormat.dwRGBBitCount,
|
|
lpSurfaceDesc->ddpfPixelFormat.dwRBitMask,
|
|
lpSurfaceDesc->ddpfPixelFormat.dwGBitMask,
|
|
lpSurfaceDesc->ddpfPixelFormat.dwBBitMask));
|
|
}
|
|
else
|
|
{
|
|
DISPDBG((0, "Failed creation of type 0x%lx YUV 0x%lx surface",
|
|
lpSurfaceDesc->ddpfPixelFormat.dwFlags,
|
|
lpSurfaceDesc->ddpfPixelFormat.dwFourCC));
|
|
}
|
|
}
|
|
|
|
|
|
lpCanCreateSurface->ddRVal = DD_OK;
|
|
return(dwRet);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdCreateSurface
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdCreateSurface(
|
|
PDD_CREATESURFACEDATA lpCreateSurface)
|
|
{
|
|
PDEV* ppdev;
|
|
DD_SURFACE_LOCAL* lpSurfaceLocal;
|
|
DD_SURFACE_GLOBAL* lpSurfaceGlobal;
|
|
LPDDSURFACEDESC lpSurfaceDesc;
|
|
DWORD dwByteCount;
|
|
LONG lLinearPitch;
|
|
DWORD dwHeight;
|
|
|
|
ppdev = (PDEV*) lpCreateSurface->lpDD->dhpdev;
|
|
|
|
DISPDBG((2, "DdCreateSurface Entered"));
|
|
// On Windows NT, dwSCnt will always be 1, so there will only ever
|
|
// be one entry in the 'lplpSList' array:
|
|
|
|
lpSurfaceLocal = lpCreateSurface->lplpSList[0];
|
|
lpSurfaceGlobal = lpSurfaceLocal->lpGbl;
|
|
lpSurfaceDesc = lpCreateSurface->lpDDSurfaceDesc;
|
|
|
|
// We repeat the same checks we did in 'DdCanCreateSurface' because
|
|
// it's possible that an application doesn't call 'DdCanCreateSurface'
|
|
// before calling 'DdCreateSurface'.
|
|
|
|
ASSERTDD(lpSurfaceGlobal->ddpfSurface.dwSize == sizeof(DDPIXELFORMAT),
|
|
"NT is supposed to guarantee that ddpfSurface.dwSize is valid");
|
|
|
|
// DdCanCreateSurface already validated whether the hardware supports
|
|
// the surface, so we don't need to do any validation here. We'll
|
|
// just go ahead and allocate it.
|
|
//
|
|
// Note that we don't do anything special for RGB surfaces that are
|
|
// the same pixel format as the display -- by returning DDHAL_DRIVER_
|
|
// NOTHANDLED, DirectDraw will automatically handle the allocation
|
|
// for us.
|
|
//
|
|
// Also, since we'll be making linear surfaces, make sure the width
|
|
// isn't unreasonably large.
|
|
//
|
|
// Note that on NT, an overlay can be created only if the driver
|
|
// okay's it here in this routine. Under Win95, the overlay will be
|
|
// created automatically if it's the same pixel format as the primary
|
|
// display.
|
|
|
|
if ((lpSurfaceLocal->ddsCaps.dwCaps & DDSCAPS_OVERLAY) ||
|
|
(lpSurfaceGlobal->ddpfSurface.dwFlags & DDPF_FOURCC) ||
|
|
(lpSurfaceGlobal->ddpfSurface.dwRBitMask != ppdev->flRed))
|
|
{
|
|
if (lpSurfaceGlobal->wWidth <= (DWORD) ppdev->cxMemory)
|
|
{
|
|
|
|
lLinearPitch = (lpSurfaceGlobal->wWidth + 7) & ~7;
|
|
if (lpSurfaceGlobal->ddpfSurface.dwFlags & DDPF_FOURCC)
|
|
{
|
|
ASSERTDD((lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUV422) ||
|
|
(lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUY2) ||
|
|
(lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_PACKJR) ||
|
|
(lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUVPLANAR),
|
|
"Expected our DdCanCreateSurface to allow only UYVY, YUY2, CLPJ, CLPL");
|
|
if((lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUV422) ||
|
|
(lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUY2))
|
|
{
|
|
dwByteCount = 2;
|
|
lLinearPitch <<= 1;
|
|
lpSurfaceLocal->dwReserved1 |= OVERLAY_FLG_YUV422;
|
|
}
|
|
else if((lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_PACKJR))
|
|
{
|
|
dwByteCount = 1;
|
|
lpSurfaceLocal->dwReserved1 |= OVERLAY_FLG_PACKJR;
|
|
}
|
|
else if((lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUVPLANAR))
|
|
{
|
|
dwByteCount = 1;
|
|
lpSurfaceLocal->dwReserved1 |= OVERLAY_FLG_YUVPLANAR;
|
|
}
|
|
else
|
|
{
|
|
dwByteCount = 1;
|
|
DISPDBG((1, "Created RGB %libpp: %li x %li Red: %lx",
|
|
8 * dwByteCount, lpSurfaceGlobal->wWidth, lpSurfaceGlobal->wHeight,
|
|
lpSurfaceGlobal->ddpfSurface.dwRBitMask));
|
|
}
|
|
|
|
// We have to fill in the bit-count for FourCC surfaces:
|
|
|
|
lpSurfaceGlobal->ddpfSurface.dwYUVBitCount = 8 * dwByteCount;
|
|
lpSurfaceGlobal->ddpfSurface.dwYBitMask = (DWORD)-1;
|
|
lpSurfaceGlobal->ddpfSurface.dwUBitMask = (DWORD)-1;
|
|
lpSurfaceGlobal->ddpfSurface.dwVBitMask = (DWORD)-1;
|
|
|
|
DISPDBG((1, "Created YUV: %li x %li",
|
|
lpSurfaceGlobal->wWidth, lpSurfaceGlobal->wHeight));
|
|
}
|
|
else
|
|
{
|
|
dwByteCount = lpSurfaceGlobal->ddpfSurface.dwRGBBitCount >> 3;
|
|
|
|
|
|
if (dwByteCount == 2)
|
|
lLinearPitch <<= 1;
|
|
|
|
DISPDBG((1, "Created RGB %libpp: %li x %li Red: %lx",
|
|
8 * dwByteCount, lpSurfaceGlobal->wWidth, lpSurfaceGlobal->wHeight,
|
|
lpSurfaceGlobal->ddpfSurface.dwRBitMask));
|
|
|
|
}
|
|
|
|
// We want to allocate a linear surface to store the FourCC
|
|
// surface, but DirectDraw is using a 2-D heap-manager because
|
|
// the rest of our surfaces have to be 2-D. So here we have to
|
|
// convert the linear size to a 2-D size.
|
|
//
|
|
// The stride has to be a dword multiple:
|
|
|
|
dwHeight = (lpSurfaceGlobal->wHeight * lLinearPitch
|
|
+ ppdev->lDelta - 1) / ppdev->lDelta;
|
|
|
|
// Now fill in enough stuff to have the DirectDraw heap-manager
|
|
// do the allocation for us:
|
|
|
|
lpSurfaceGlobal->fpVidMem = DDHAL_PLEASEALLOC_BLOCKSIZE;
|
|
lpSurfaceGlobal->dwBlockSizeX = ppdev->lDelta; // Specified in bytes
|
|
lpSurfaceGlobal->dwBlockSizeY = dwHeight;
|
|
lpSurfaceGlobal->lPitch = lLinearPitch;
|
|
|
|
lpSurfaceDesc->lPitch = lLinearPitch;
|
|
lpSurfaceDesc->dwFlags |= DDSD_PITCH;
|
|
lpSurfaceLocal->dwReserved1 |= OVERLAY_FLG_OVERLAY;
|
|
if (lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUVPLANAR)
|
|
{
|
|
ppdev->PlanarCnt++;
|
|
}
|
|
else
|
|
{
|
|
ppdev->OvlyCnt++;
|
|
}
|
|
ppdev->fpBaseOverlay = 0xffffffff;
|
|
}
|
|
else
|
|
{
|
|
DISPDBG((1, "Refused to create surface with large width"));
|
|
}
|
|
}
|
|
|
|
return(DDHAL_DRIVER_NOTHANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdDestroySurface
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdDestroySurface (PDD_DESTROYSURFACEDATA lpDestroySurface)
|
|
{
|
|
PDEV* ppdev;
|
|
BYTE* pjPorts;
|
|
|
|
ppdev = (PDEV*) lpDestroySurface->lpDD->dhpdev;
|
|
pjPorts = ppdev->pjPorts;
|
|
|
|
DISPDBG((2, "In DestroyOverlaySurface"));
|
|
if (lpDestroySurface->lpDDSurface->dwReserved1 & OVERLAY_FLG_ENABLED)
|
|
{
|
|
BYTE bTemp;
|
|
/*
|
|
* Turn the video off
|
|
*/
|
|
DISPDBG((1,"Turning off video in DestroySurface"));
|
|
ppdev->pfnDisableOverlay(ppdev);
|
|
ppdev->pfnClearAltFIFOThreshold(ppdev);
|
|
|
|
if (lpDestroySurface->lpDDSurface->dwReserved1 & OVERLAY_FLG_COLOR_KEY)
|
|
{
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a);
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Clear CR1A[3:2]
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x0C);
|
|
}
|
|
|
|
/*
|
|
* Turn off YUV Planar
|
|
*/
|
|
if (lpDestroySurface->lpDDSurface->dwReserved1 & OVERLAY_FLG_YUVPLANAR)
|
|
{
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, (0x00 << 8) | 0x3f); // Turn off YUV Planar
|
|
}
|
|
ppdev->fpVisibleOverlay = (FLATPTR)NULL;
|
|
|
|
ppdev->dwPanningFlag &= ~OVERLAY_OLAY_SHOW;
|
|
}
|
|
if (lpDestroySurface->lpDDSurface->dwReserved1 & OVERLAY_FLG_YUVPLANAR)
|
|
{
|
|
if (ppdev->PlanarCnt > 0)
|
|
ppdev->PlanarCnt--;
|
|
}
|
|
else
|
|
{
|
|
if (ppdev->OvlyCnt > 0)
|
|
ppdev->OvlyCnt--;
|
|
}
|
|
|
|
if (lpDestroySurface->lpDDSurface->ddsCaps.dwCaps & DDSCAPS_LIVEVIDEO)
|
|
{
|
|
BYTE bTemp;
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x51);
|
|
bTemp= CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x08);
|
|
}
|
|
|
|
return(DDHAL_DRIVER_NOTHANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdSetColorKey
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdSetColorKey(
|
|
PDD_SETCOLORKEYDATA lpSetColorKey)
|
|
{
|
|
PDEV* ppdev;
|
|
BYTE* pjPorts;
|
|
BYTE* pjBase;
|
|
DD_SURFACE_GLOBAL* lpSurface;
|
|
DWORD dwKeyLow;
|
|
DWORD dwKeyHigh;
|
|
|
|
ppdev = (PDEV*) lpSetColorKey->lpDD->dhpdev;
|
|
|
|
DISPDBG((2, "DdSetColorKey Entered"));
|
|
|
|
ASSERTDD(ppdev->flStatus & STAT_STREAMS_ENABLED, "Shouldn't have hooked call");
|
|
|
|
pjPorts = ppdev->pjPorts;
|
|
pjBase = ppdev->pjBase;
|
|
lpSurface = lpSetColorKey->lpDDSurface->lpGbl;
|
|
|
|
// We don't have to do anything for normal blt source colour keys:
|
|
|
|
if (lpSetColorKey->dwFlags & DDCKEY_SRCBLT)
|
|
{
|
|
lpSetColorKey->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
else if ((lpSetColorKey->dwFlags & DDCKEY_DESTOVERLAY) &&
|
|
(lpSetColorKey->lpDDSurface == ppdev->lpColorSurface))
|
|
{
|
|
if (lpSurface->fpVidMem == ppdev->fpVisibleOverlay)
|
|
{
|
|
ppdev->wColorKey = (WORD) lpSetColorKey->ckNew.dwColorSpaceLowValue;
|
|
ppdev->pfnRegInitVideo(ppdev, lpSetColorKey->lpDDSurface);
|
|
}
|
|
lpSetColorKey->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
else if ((lpSetColorKey->dwFlags & DDCKEY_SRCOVERLAY) &&
|
|
(lpSetColorKey->lpDDSurface == ppdev->lpSrcColorSurface))
|
|
{
|
|
if (lpSurface->fpVidMem == ppdev->fpVisibleOverlay)
|
|
{
|
|
ppdev->dwSrcColorKeyLow = lpSetColorKey->ckNew.dwColorSpaceLowValue;
|
|
ppdev->dwSrcColorKeyHigh = lpSetColorKey->ckNew.dwColorSpaceHighValue;
|
|
if (ppdev->dwSrcColorKeyLow > ppdev->dwSrcColorKeyHigh)
|
|
{
|
|
ppdev->dwSrcColorKeyHigh = ppdev->dwSrcColorKeyLow;
|
|
}
|
|
ppdev->pfnRegInitVideo(ppdev, lpSetColorKey->lpDDSurface);
|
|
}
|
|
lpSetColorKey->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
DISPDBG((1, "DdSetColorKey: Invalid command"));
|
|
return(DDHAL_DRIVER_NOTHANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdUpdateOverlay
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdUpdateOverlay(
|
|
PDD_UPDATEOVERLAYDATA lpUpdateOverlay)
|
|
{
|
|
PDEV* ppdev;
|
|
BYTE* pjPorts;
|
|
BYTE* pjBase;
|
|
DD_SURFACE_GLOBAL* lpSource;
|
|
DD_SURFACE_GLOBAL* lpDestination;
|
|
DWORD dwStride;
|
|
LONG srcWidth;
|
|
LONG srcHeight;
|
|
LONG dstWidth;
|
|
LONG dstHeight;
|
|
DWORD dwBitCount;
|
|
DWORD dwStart;
|
|
DWORD dwTmp;
|
|
BOOL bColorKey;
|
|
DWORD dwKeyLow;
|
|
DWORD dwKeyHigh;
|
|
DWORD dwBytesPerPixel;
|
|
|
|
DWORD dwSecCtrl;
|
|
DWORD dwBlendCtrl;
|
|
|
|
DWORD dwFourcc;
|
|
BOOL bCheckBandwidth;
|
|
WORD wBitCount;
|
|
DWORD_PTR dwOldStatus;
|
|
BYTE bTemp;
|
|
|
|
ppdev = (PDEV*) lpUpdateOverlay->lpDD->dhpdev;
|
|
|
|
DISPDBG((2, "DdUpdateOverlay Entered"));
|
|
ASSERTDD(ppdev->flStatus & STAT_STREAMS_ENABLED, "Shouldn't have hooked call");
|
|
|
|
pjPorts = ppdev->pjPorts;
|
|
pjBase = ppdev->pjBase;
|
|
|
|
//myf33 begin
|
|
// Initialize the bandwidth registers
|
|
Regs.bSR2F = 0;
|
|
Regs.bSR32 = 0;
|
|
Regs.bSR34 = 0;
|
|
Regs.bCR42 = 0;
|
|
//myf33 end
|
|
|
|
if (lpUpdateOverlay->lpDDSrcSurface->dwFlags & DDRAWISURF_HASPIXELFORMAT)
|
|
{
|
|
GetFormatInfo(ppdev, &(lpUpdateOverlay->lpDDSrcSurface->lpGbl->ddpfSurface),
|
|
&dwFourcc, &wBitCount);
|
|
}
|
|
else
|
|
{
|
|
// This needs to be changed when primary surface is RGB 5:6:5
|
|
dwFourcc = BI_RGB;
|
|
wBitCount = (WORD) ppdev->cBitsPerPixel;
|
|
}
|
|
|
|
/*
|
|
* Are we color keying?
|
|
*/
|
|
bCheckBandwidth = TRUE;
|
|
ppdev->lpColorSurface = ppdev->lpSrcColorSurface = NULL;
|
|
dwOldStatus = lpUpdateOverlay->lpDDSrcSurface->dwReserved1;
|
|
if ((lpUpdateOverlay->dwFlags & (DDOVER_KEYDEST | DDOVER_KEYDESTOVERRIDE)) &&
|
|
(lpUpdateOverlay->dwFlags & (DDOVER_KEYSRC | DDOVER_KEYSRCOVERRIDE)))
|
|
{
|
|
/*
|
|
* Cannot perform src colorkey and dest colorkey at the same time
|
|
*/
|
|
lpUpdateOverlay->ddRVal = DDERR_NOCOLORKEYHW;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
lpUpdateOverlay->lpDDSrcSurface->dwReserved1 &= ~(OVERLAY_FLG_COLOR_KEY|OVERLAY_FLG_SRC_COLOR_KEY);
|
|
if (lpUpdateOverlay->dwFlags & (DDOVER_KEYDEST | DDOVER_KEYDESTOVERRIDE))
|
|
{
|
|
if (ppdev->pfnIsSufficientBandwidth(ppdev, wBitCount, &(lpUpdateOverlay->rSrc),
|
|
&(lpUpdateOverlay->rDest), OVERLAY_FLG_COLOR_KEY))
|
|
{
|
|
bCheckBandwidth = FALSE;
|
|
lpUpdateOverlay->lpDDSrcSurface->dwReserved1 |= OVERLAY_FLG_COLOR_KEY;
|
|
if (lpUpdateOverlay->dwFlags & DDOVER_KEYDEST)
|
|
{
|
|
ppdev->wColorKey = (WORD)
|
|
lpUpdateOverlay->lpDDDestSurface->ddckCKDestOverlay.dwColorSpaceLowValue;
|
|
ppdev->lpColorSurface = lpUpdateOverlay->lpDDDestSurface;
|
|
}
|
|
else
|
|
{
|
|
ppdev->wColorKey = (WORD)
|
|
lpUpdateOverlay->overlayFX.dckDestColorkey.dwColorSpaceLowValue;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
lpUpdateOverlay->ddRVal = DDERR_NOCOLORKEYHW;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
}
|
|
else if (lpUpdateOverlay->dwFlags & (DDOVER_KEYSRC | DDOVER_KEYSRCOVERRIDE))
|
|
{
|
|
if (ppdev->pfnIsSufficientBandwidth(ppdev, wBitCount, &(lpUpdateOverlay->rSrc),
|
|
&(lpUpdateOverlay->rDest), OVERLAY_FLG_SRC_COLOR_KEY))
|
|
{
|
|
bCheckBandwidth = FALSE;
|
|
lpUpdateOverlay->lpDDSrcSurface->dwReserved1 |= OVERLAY_FLG_SRC_COLOR_KEY;
|
|
ppdev->lpSrcColorSurface = lpUpdateOverlay->lpDDSrcSurface;
|
|
if (lpUpdateOverlay->dwFlags & DDOVER_KEYSRC)
|
|
{
|
|
ppdev->dwSrcColorKeyLow =
|
|
lpUpdateOverlay->lpDDSrcSurface->ddckCKSrcOverlay.dwColorSpaceLowValue;
|
|
ppdev->dwSrcColorKeyHigh =
|
|
lpUpdateOverlay->lpDDSrcSurface->ddckCKSrcOverlay.dwColorSpaceHighValue;
|
|
}
|
|
else
|
|
{
|
|
ppdev->dwSrcColorKeyLow =
|
|
lpUpdateOverlay->overlayFX.dckSrcColorkey.dwColorSpaceLowValue;
|
|
ppdev->dwSrcColorKeyHigh =
|
|
lpUpdateOverlay->overlayFX.dckSrcColorkey.dwColorSpaceHighValue;
|
|
}
|
|
if (ppdev->dwSrcColorKeyHigh < ppdev->dwSrcColorKeyHigh)
|
|
{
|
|
ppdev->dwSrcColorKeyHigh = ppdev->dwSrcColorKeyLow;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
DISPDBG((0, "Insufficient bandwidth for colorkeying"));
|
|
lpUpdateOverlay->ddRVal = DDERR_NOCOLORKEYHW;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
}
|
|
|
|
// 'Source' is the overlay surface, 'destination' is the surface to
|
|
// be overlayed:
|
|
|
|
lpSource = lpUpdateOverlay->lpDDSrcSurface->lpGbl;
|
|
|
|
if (lpUpdateOverlay->dwFlags & DDOVER_HIDE)
|
|
{
|
|
if (lpSource->fpVidMem == ppdev->fpVisibleOverlay)
|
|
{
|
|
/*
|
|
* Turn the video off
|
|
*/
|
|
ppdev->pfnDisableOverlay(ppdev);
|
|
ppdev->pfnClearAltFIFOThreshold(ppdev);
|
|
|
|
/*
|
|
* If we are color keying, we will disable that now
|
|
*/
|
|
if (dwOldStatus & OVERLAY_FLG_COLOR_KEY)
|
|
{
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a);
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Clear CR1A[3:2]
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x0C);
|
|
}
|
|
|
|
ppdev->dwPanningFlag &= ~OVERLAY_OLAY_SHOW;
|
|
lpUpdateOverlay->lpDDSrcSurface->dwReserved1 &= ~OVERLAY_FLG_ENABLED;
|
|
ppdev->fpVisibleOverlay = 0;
|
|
}
|
|
|
|
lpUpdateOverlay->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
// Dereference 'lpDDDestSurface' only after checking for the DDOVER_HIDE
|
|
// case:
|
|
#if 0
|
|
/*
|
|
* Turn the video off first to protect side effect when moving.
|
|
* Later RegIniVideo will turn it on if needed.
|
|
*/
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x3e);
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x01); // Clear CR3E[0]
|
|
#endif
|
|
|
|
lpDestination = lpUpdateOverlay->lpDDDestSurface->lpGbl;
|
|
|
|
if (lpSource->fpVidMem != ppdev->fpVisibleOverlay)
|
|
{
|
|
if (lpUpdateOverlay->dwFlags & DDOVER_SHOW)
|
|
{
|
|
if (ppdev->fpVisibleOverlay != 0)
|
|
{
|
|
// Some other overlay is already visible:
|
|
|
|
DISPDBG((0, "DdUpdateOverlay: An overlay is already visible"));
|
|
|
|
lpUpdateOverlay->ddRVal = DDERR_OUTOFCAPS;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
else
|
|
{
|
|
// We're going to make the overlay visible, so mark it as
|
|
// such:
|
|
|
|
ppdev->fpVisibleOverlay = lpSource->fpVidMem;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// The overlay isn't visible, and we haven't been asked to make
|
|
// it visible, so this call is trivially easy:
|
|
|
|
lpUpdateOverlay->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Is there sufficient bandwidth to work?
|
|
*/
|
|
if (bCheckBandwidth && !ppdev->pfnIsSufficientBandwidth(ppdev, wBitCount,
|
|
&(lpUpdateOverlay->rSrc), &(lpUpdateOverlay->rDest), 0))
|
|
{
|
|
lpUpdateOverlay->ddRVal = DDERR_OUTOFCAPS;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/*
|
|
* Save the rectangles
|
|
*/
|
|
ppdev->rOverlaySrc = lpUpdateOverlay->rSrc;
|
|
ppdev->rOverlayDest = lpUpdateOverlay->rDest;
|
|
|
|
if (lpUpdateOverlay->lpDDSrcSurface->dwReserved1 & OVERLAY_FLG_DECIMATE)
|
|
{
|
|
ppdev->rOverlaySrc.right = ppdev->rOverlaySrc.left +
|
|
((ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left) >> 1);
|
|
}
|
|
|
|
if (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left <= MIN_OLAY_WIDTH)
|
|
{
|
|
lpUpdateOverlay->ddRVal = DDERR_OUTOFCAPS;
|
|
return (DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
lpUpdateOverlay->lpDDSrcSurface->dwReserved1 |= OVERLAY_FLG_ENABLED;
|
|
|
|
//
|
|
// Assign 5c to 1F when video is on while no color key for 5446BE.
|
|
//
|
|
// sge04
|
|
//if (bCheckBandwidth && ppdev->flCaps & CAPS_SECOND_APERTURE)
|
|
if (ppdev->flCaps & CAPS_SECOND_APERTURE)
|
|
ppdev->lFifoThresh = 0x0E;
|
|
|
|
ppdev->pfnRegInitVideo(ppdev, lpUpdateOverlay->lpDDSrcSurface);
|
|
|
|
lpUpdateOverlay->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
/******************************Public*Routine******************************\
|
|
* DWORD DdSetOverlayPosition
|
|
*
|
|
\**************************************************************************/
|
|
|
|
DWORD DdSetOverlayPosition(
|
|
PDD_SETOVERLAYPOSITIONDATA lpSetOverlayPosition)
|
|
{
|
|
PDEV* ppdev;
|
|
BYTE* pjPorts;
|
|
BYTE* pjBase;
|
|
|
|
ppdev = (PDEV*) lpSetOverlayPosition->lpDD->dhpdev;
|
|
pjPorts = ppdev->pjPorts;
|
|
pjBase = ppdev->pjBase;
|
|
|
|
DISPDBG((2, "DdSetOverlayPosition Entered"));
|
|
ASSERTDD(ppdev->flStatus & STAT_STREAMS_ENABLED, "Shouldn't have hooked call");
|
|
|
|
if(lpSetOverlayPosition->lpDDSrcSurface->lpGbl->fpVidMem == ppdev->fpVisibleOverlay)
|
|
{
|
|
/*
|
|
* Update the rectangles
|
|
*/
|
|
ppdev->rOverlayDest.right = (ppdev->rOverlayDest.right - ppdev->rOverlayDest.left)
|
|
+ lpSetOverlayPosition->lXPos;
|
|
ppdev->rOverlayDest.left = lpSetOverlayPosition->lXPos;
|
|
ppdev->rOverlayDest.bottom = (ppdev->rOverlayDest.bottom - ppdev->rOverlayDest.top)
|
|
+ lpSetOverlayPosition->lYPos;
|
|
ppdev->rOverlayDest.top = lpSetOverlayPosition->lYPos;
|
|
|
|
//myf29 RegMoveVideo(ppdev, lpSetOverlayPosition->lpDDSrcSurface);
|
|
ppdev->pfnRegMoveVideo(ppdev, lpSetOverlayPosition->lpDDSrcSurface);
|
|
}
|
|
|
|
lpSetOverlayPosition->ddRVal = DD_OK;
|
|
return(DDHAL_DRIVER_HANDLED);
|
|
}
|
|
|
|
|
|
/******************************************************************************\
|
|
*
|
|
* Function: DrvGetDirectDrawInfo
|
|
*
|
|
* This function returns te capabilities of the DirectDraw implementation. It is
|
|
* called twice during the connect phase.
|
|
*
|
|
* Parameters: dhpdev Handle to physical device.
|
|
* pHalInfo Pointer to a DD_HALINFO structure.
|
|
* pdwNumHeaps Pointer to a variable that holds the number of
|
|
* heaps.
|
|
* pvmList Pointer to the heap array.
|
|
* pdwNumFourCC Pointer to a variable that holds the number of
|
|
* FourCC IDs.
|
|
* pdwFourCC Pointer to FourCC IDs.
|
|
*
|
|
* Returns: TRUE if successful.
|
|
*
|
|
\******************************************************************************/
|
|
BOOL DrvGetDirectDrawInfo(
|
|
DHPDEV dhpdev,
|
|
DD_HALINFO* pHalInfo,
|
|
DWORD* pdwNumHeaps,
|
|
VIDEOMEMORY* pvmList,
|
|
DWORD* pdwNumFourCC,
|
|
DWORD* pdwFourCC)
|
|
{
|
|
BOOL bCanFlip;
|
|
PDEV* ppdev = (PPDEV) dhpdev;
|
|
LONGLONG li;
|
|
OH* poh;
|
|
RECTL rSrc, rDest;
|
|
LONG lZoom;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
BYTE bTemp;
|
|
|
|
// We may not support DirectDraw on this card.
|
|
if (!(ppdev->flStatus & STAT_DIRECTDRAW))
|
|
{
|
|
return(FALSE);
|
|
}
|
|
|
|
DISPDBG((2, "DrvGetDirectDrawInfo Entered"));
|
|
pHalInfo->dwSize = sizeof(DD_HALINFO);
|
|
|
|
// Current primary surface attributes. Since HalInfo is zero-initialized by
|
|
// GDI, we only have to fill in the fields which should be non-zero.
|
|
|
|
pHalInfo->vmiData.pvPrimary = ppdev->pjScreen;
|
|
pHalInfo->vmiData.dwDisplayWidth = ppdev->cxScreen;
|
|
pHalInfo->vmiData.dwDisplayHeight = ppdev->cyScreen;
|
|
pHalInfo->vmiData.lDisplayPitch = ppdev->lDelta;
|
|
pHalInfo->vmiData.dwOffscreenAlign = 4;
|
|
|
|
pHalInfo->vmiData.ddpfDisplay.dwSize = sizeof(DDPIXELFORMAT);
|
|
pHalInfo->vmiData.ddpfDisplay.dwFlags = DDPF_RGB;
|
|
|
|
pHalInfo->vmiData.ddpfDisplay.dwRGBBitCount = ppdev->cBitsPerPixel;
|
|
|
|
if (ppdev->cBpp == 1)
|
|
{
|
|
pHalInfo->vmiData.ddpfDisplay.dwFlags |= DDPF_PALETTEINDEXED8;
|
|
}
|
|
|
|
// These masks will be zero at 8bpp.
|
|
pHalInfo->vmiData.ddpfDisplay.dwRBitMask = ppdev->flRed;
|
|
pHalInfo->vmiData.ddpfDisplay.dwGBitMask = ppdev->flGreen;
|
|
pHalInfo->vmiData.ddpfDisplay.dwBBitMask = ppdev->flBlue;
|
|
|
|
if (ppdev->cBpp == 4)
|
|
{
|
|
pHalInfo->vmiData.ddpfDisplay.dwRGBAlphaBitMask =
|
|
~(ppdev->flRed | ppdev->flGreen | ppdev->flBlue);
|
|
}
|
|
|
|
// Set up the pointer to the first available video memory after the primary
|
|
// surface.
|
|
bCanFlip = FALSE;
|
|
*pdwNumHeaps = 0;
|
|
|
|
// Free up as much off-screen memory as possible.
|
|
bMoveAllDfbsFromOffscreenToDibs(ppdev); // Move all DFBs to DIB.s
|
|
vAssertModeText(ppdev, FALSE); // Destroy all cached fonts.
|
|
|
|
if ((ppdev->ulChipID == CL7555_ID) || (ppdev->ulChipID == CL7556_ID))//myf32
|
|
{
|
|
MIN_OLAY_WIDTH = 16;
|
|
#if (_WIN32_WINNT >= 0x0400)
|
|
ppdev->flCaps |= CAPS_VIDEO;
|
|
#endif
|
|
ppdev->pfnIsSufficientBandwidth=Is7555SufficientBandwidth;
|
|
ppdev->pfnRegInitVideo=RegInit7555Video;
|
|
ppdev->pfnRegMoveVideo=RegMove7555Video;
|
|
ppdev->pfnDisableOverlay=DisableVideoWindow;
|
|
ppdev->pfnClearAltFIFOThreshold=ClearAltFIFOThreshold;
|
|
}
|
|
else
|
|
{
|
|
ppdev->pfnIsSufficientBandwidth =
|
|
(ppdev->ulChipID != 0xBC) ?
|
|
IsSufficientBandwidth : Is5480SufficientBandwidth ; // chu03
|
|
|
|
ppdev->pfnRegInitVideo=RegInitVideo;
|
|
ppdev->pfnRegMoveVideo=RegMoveVideo;
|
|
ppdev->pfnDisableOverlay=DisableOverlay_544x;
|
|
ppdev->pfnClearAltFIFOThreshold=ClearAltFIFOThreshold_544x;
|
|
}
|
|
|
|
// Now simply reserve the biggest chunk for use by DirectDraw.
|
|
poh = ppdev->pohDirectDraw;
|
|
#if (DIRECTX_24 < 2)
|
|
if ((poh == NULL) && (ppdev->cBpp != 3))
|
|
#else
|
|
if (poh == NULL)
|
|
#endif
|
|
{
|
|
LONG cxMax, cyMax;
|
|
|
|
cxMax = ppdev->heap.cxMax & ~(HEAP_X_ALIGNMENT - 1);
|
|
cyMax = ppdev->heap.cyMax;
|
|
|
|
poh = pohAllocatePermanent(ppdev, cxMax, cyMax);
|
|
if (poh == NULL)
|
|
{
|
|
// Could not allocate all memory, find the biggest area now.
|
|
cxMax = cyMax = 0;
|
|
for (poh = ppdev->heap.ohAvailable.pohNext;
|
|
poh != &ppdev->heap.ohAvailable; poh = poh->pohNext)
|
|
{
|
|
if ((poh->cx * poh->cy) > (cxMax * cyMax))
|
|
{
|
|
cxMax = poh->cx & ~(HEAP_X_ALIGNMENT - 1);
|
|
cyMax = poh->cy;
|
|
}
|
|
}
|
|
|
|
poh = pohAllocatePermanent(ppdev, cxMax, cyMax);
|
|
}
|
|
|
|
ppdev->pohDirectDraw = poh;
|
|
}
|
|
|
|
if (poh != NULL)
|
|
{
|
|
*pdwNumHeaps = 1;
|
|
|
|
// Fill in the list of off-screen rectangles if we've been asked to do
|
|
// so.
|
|
if (pvmList != NULL)
|
|
{
|
|
DISPDBG((1, "DirectDraw gets %d x %d surface at (%d, %d)",
|
|
poh->cx, poh->cy, poh->x, poh->y));
|
|
|
|
#if 0
|
|
if (PELS_TO_BYTES(poh->cx) != ppdev->lDelta)
|
|
{
|
|
#endif
|
|
pvmList->dwFlags = VIDMEM_ISRECTANGULAR;
|
|
pvmList->fpStart = poh->xy;
|
|
pvmList->dwWidth = PELS_TO_BYTES(poh->cx);
|
|
pvmList->dwHeight = poh->cy;
|
|
#if 0
|
|
}
|
|
else
|
|
{
|
|
pvmList->dwFlags = VIDMEM_ISLINEAR;
|
|
pvmList->fpStart = poh->xy;
|
|
pvmList->fpEnd = poh->xy - 1
|
|
+ PELS_TO_BYTES(poh->cx)
|
|
+ poh->cy * ppdev->lDelta;
|
|
}
|
|
#endif
|
|
|
|
pvmList->ddsCaps.dwCaps = DDSCAPS_OFFSCREENPLAIN;
|
|
if ((poh->cx >= ppdev->cxScreen) && (poh->cy >= ppdev->cyScreen))
|
|
{
|
|
bCanFlip = TRUE;
|
|
}
|
|
}
|
|
}
|
|
|
|
// Capabilities supported.
|
|
pHalInfo->ddCaps.dwFXCaps = 0;
|
|
pHalInfo->ddCaps.dwCaps = DDCAPS_BLT
|
|
| DDCAPS_BLTCOLORFILL
|
|
| DDCAPS_READSCANLINE; // sge08 add this bit
|
|
|
|
pHalInfo->ddCaps.dwCaps2 = DDCAPS2_COPYFOURCC;
|
|
|
|
if ( (ppdev->flCaps & CAPS_VIDEO) && (ppdev->cBpp <= 2) )
|
|
{
|
|
pHalInfo->ddCaps.dwCaps |= DDCAPS_COLORKEY;
|
|
pHalInfo->ddCaps.dwCKeyCaps = DDCKEYCAPS_SRCBLT;
|
|
}
|
|
|
|
pHalInfo->ddCaps.ddsCaps.dwCaps = DDSCAPS_OFFSCREENPLAIN
|
|
| DDSCAPS_PRIMARYSURFACE;
|
|
if (bCanFlip)
|
|
{
|
|
pHalInfo->ddCaps.ddsCaps.dwCaps |= DDSCAPS_FLIP;
|
|
}
|
|
|
|
// FourCCs supported.
|
|
*pdwNumFourCC = 0;
|
|
|
|
#if 0 // smac - disable overlays due to too many bugs
|
|
{
|
|
|
|
//
|
|
// Interlaced mode ?
|
|
//
|
|
BOOL Interlaced ; // chu02
|
|
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a) ;
|
|
Interlaced = CP_IN_BYTE(pjPorts, CRTC_DATA) & 0x01 ;
|
|
|
|
//
|
|
// Needs check more later
|
|
//
|
|
if ((ppdev->flCaps & CAPS_VIDEO) && (!Interlaced)) // chu02
|
|
ppdev->flStatus |= STAT_STREAMS_ENABLED;
|
|
|
|
if (ppdev->flStatus & STAT_STREAMS_ENABLED)
|
|
{
|
|
|
|
/*
|
|
* Are we double clocked?
|
|
*/
|
|
ppdev->bDoubleClock = FALSE;
|
|
//
|
|
// use SR7 to check the double clock instead of hidden register
|
|
//
|
|
//
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, 0x7);
|
|
bTemp = CP_IN_BYTE(pjPorts, SR_DATA);
|
|
|
|
if ((((bTemp & 0x0E) == 0x06) && ppdev->cBitsPerPixel == 8) ||
|
|
(((bTemp & 0x0E) == 0x08) && ppdev->cBitsPerPixel == 16))
|
|
{
|
|
ppdev->bDoubleClock = TRUE;
|
|
}
|
|
|
|
pHalInfo->vmiData.dwOverlayAlign = 8;
|
|
|
|
pHalInfo->ddCaps.dwCaps |= DDCAPS_OVERLAY
|
|
| DDCAPS_OVERLAYSTRETCH
|
|
| DDCAPS_OVERLAYFOURCC
|
|
| DDCAPS_OVERLAYCANTCLIP
|
|
| DDCAPS_ALIGNSTRIDE;
|
|
|
|
pHalInfo->ddCaps.dwFXCaps |= DDFXCAPS_OVERLAYSTRETCHX
|
|
| DDFXCAPS_OVERLAYSTRETCHY
|
|
| DDFXCAPS_OVERLAYARITHSTRETCHY;
|
|
|
|
pHalInfo->ddCaps.dwCKeyCaps |= DDCKEYCAPS_DESTOVERLAY
|
|
| DDCKEYCAPS_DESTOVERLAYYUV
|
|
| DDCKEYCAPS_DESTOVERLAYONEACTIVE;
|
|
|
|
pHalInfo->ddCaps.dwCKeyCaps |= DDCKEYCAPS_SRCOVERLAY
|
|
| DDCKEYCAPS_SRCOVERLAYCLRSPACE
|
|
| DDCKEYCAPS_SRCOVERLAYCLRSPACEYUV
|
|
| DDCKEYCAPS_SRCOVERLAYONEACTIVE
|
|
| DDCKEYCAPS_SRCOVERLAYYUV;
|
|
|
|
pHalInfo->ddCaps.ddsCaps.dwCaps |= DDSCAPS_OVERLAY;
|
|
|
|
*pdwNumFourCC = 3;
|
|
if ((ppdev->ulChipID == 0x40) || (ppdev->ulChipID == 0x4C)) //tao1
|
|
*pdwNumFourCC = 2; //tao1
|
|
|
|
if (pdwFourCC)
|
|
{
|
|
pdwFourCC[0] = FOURCC_YUV422;
|
|
pdwFourCC[1] = FOURCC_PACKJR;
|
|
if ((ppdev->ulChipID != 0x40) && (ppdev->ulChipID != 0x4C)) //tao1
|
|
pdwFourCC[2] = FOURCC_YUY2; //tao1
|
|
}
|
|
|
|
pHalInfo->ddCaps.dwMaxVisibleOverlays = 1;
|
|
pHalInfo->ddCaps.dwCurrVisibleOverlays = 0;
|
|
pHalInfo->ddCaps.dwNumFourCCCodes = 2;
|
|
# if 1
|
|
pHalInfo->ddCaps.dwAlignBoundarySrc = 1;
|
|
pHalInfo->ddCaps.dwAlignSizeSrc = 1;
|
|
// chu01 sge05
|
|
#if 1
|
|
if ((ppdev->cBpp == 3) || ppdev->bDoubleClock )
|
|
{
|
|
pHalInfo->ddCaps.dwAlignBoundaryDest = 4;
|
|
pHalInfo->ddCaps.dwAlignSizeDest = 4;
|
|
}
|
|
else
|
|
{
|
|
pHalInfo->ddCaps.dwAlignBoundaryDest = 1;
|
|
pHalInfo->ddCaps.dwAlignSizeDest = 1;
|
|
}
|
|
#else
|
|
pHalInfo->ddCaps.dwAlignBoundaryDest = 1;
|
|
pHalInfo->ddCaps.dwAlignSizeDest = 1;
|
|
#endif // 1
|
|
pHalInfo->ddCaps.dwAlignStrideAlign = 8;
|
|
pHalInfo->ddCaps.dwMinOverlayStretch = 8000;
|
|
pHalInfo->ddCaps.dwMinLiveVideoStretch = 8000;
|
|
pHalInfo->ddCaps.dwMinHwCodecStretch = 8000;
|
|
pHalInfo->ddCaps.dwMaxOverlayStretch = 8000;
|
|
pHalInfo->ddCaps.dwMaxLiveVideoStretch = 8000;
|
|
pHalInfo->ddCaps.dwMaxHwCodecStretch = 8000;
|
|
//
|
|
// maybe there are special requirement for VCLK > 85Hz
|
|
//
|
|
#endif
|
|
rSrc.left = rSrc.top = 0;
|
|
rSrc.right = 320;
|
|
rSrc.bottom = 240;
|
|
rDest.left = rDest.top = 0;
|
|
rDest.right = 1280;
|
|
rDest.bottom = 960;
|
|
lZoom = 1000;
|
|
do
|
|
{
|
|
rDest.right = (320 * lZoom)/ 1000;
|
|
rDest.bottom = (240 * lZoom)/1000;
|
|
if (ppdev->pfnIsSufficientBandwidth(ppdev, 16, (LPRECTL) &rSrc, (LPRECTL) &rDest, 0))
|
|
{
|
|
DISPDBG((1, "Minimum zoom factor: %d", lZoom));
|
|
pHalInfo->ddCaps.dwMinOverlayStretch = lZoom;
|
|
pHalInfo->ddCaps.dwMinLiveVideoStretch = lZoom;
|
|
pHalInfo->ddCaps.dwMinHwCodecStretch = lZoom;
|
|
lZoom = 4000;
|
|
}
|
|
lZoom += 100;
|
|
} while (lZoom < 4000);
|
|
}
|
|
}
|
|
#endif // smac
|
|
|
|
return(TRUE);
|
|
}
|
|
|
|
|
|
/******************************************************************************\
|
|
*
|
|
* Function: DrvEnableDirectDraw
|
|
*
|
|
* Enable DirectDraw. This function is called when an application opens a
|
|
* DirectDraw connection.
|
|
*
|
|
* Parameters: dhpdev Handle to physical device.
|
|
* pCallBacks Pointer to DirectDraw callbacks.
|
|
* pSurfaceCallBacks Pointer to surface callbacks.
|
|
* pPaletteCallBacks Pointer to palette callbacks.
|
|
*
|
|
* Returns: TRUE if successful.
|
|
*
|
|
\******************************************************************************/
|
|
BOOL DrvEnableDirectDraw(
|
|
DHPDEV dhpdev,
|
|
DD_CALLBACKS* pCallBacks,
|
|
DD_SURFACECALLBACKS* pSurfaceCallBacks,
|
|
DD_PALETTECALLBACKS* pPaletteCallBacks)
|
|
{
|
|
PDEV* ppdev = (PPDEV) dhpdev;
|
|
|
|
pCallBacks->WaitForVerticalBlank = DdWaitForVerticalBlank;
|
|
pCallBacks->MapMemory = DdMapMemory;
|
|
pCallBacks->GetScanLine = DdGetScanLine;
|
|
pCallBacks->dwFlags = DDHAL_CB32_WAITFORVERTICALBLANK
|
|
| DDHAL_CB32_MAPMEMORY
|
|
| DDHAL_CB32_GETSCANLINE;
|
|
|
|
pSurfaceCallBacks->Blt = DdBlt;
|
|
pSurfaceCallBacks->Flip = DdFlip;
|
|
pSurfaceCallBacks->Lock = DdLock;
|
|
pSurfaceCallBacks->GetBltStatus = DdGetBltStatus;
|
|
pSurfaceCallBacks->GetFlipStatus = DdGetFlipStatus;
|
|
pSurfaceCallBacks->dwFlags = DDHAL_SURFCB32_BLT
|
|
| DDHAL_SURFCB32_FLIP
|
|
| DDHAL_SURFCB32_LOCK
|
|
| DDHAL_SURFCB32_GETBLTSTATUS
|
|
| DDHAL_SURFCB32_GETFLIPSTATUS;
|
|
|
|
if (ppdev->flStatus & STAT_STREAMS_ENABLED)
|
|
{
|
|
pCallBacks->CreateSurface = DdCreateSurface;
|
|
pCallBacks->CanCreateSurface = DdCanCreateSurface;
|
|
pCallBacks->dwFlags |= DDHAL_CB32_CREATESURFACE
|
|
| DDHAL_CB32_CANCREATESURFACE;
|
|
|
|
pSurfaceCallBacks->SetColorKey = DdSetColorKey;
|
|
pSurfaceCallBacks->UpdateOverlay = DdUpdateOverlay;
|
|
pSurfaceCallBacks->SetOverlayPosition = DdSetOverlayPosition;
|
|
pSurfaceCallBacks->DestroySurface = DdDestroySurface;
|
|
pSurfaceCallBacks->dwFlags |= DDHAL_SURFCB32_SETCOLORKEY
|
|
| DDHAL_SURFCB32_UPDATEOVERLAY
|
|
| DDHAL_SURFCB32_SETOVERLAYPOSITION
|
|
| DDHAL_SURFCB32_DESTROYSURFACE;
|
|
|
|
// The DrvEnableDirectDraw call can occur while we're in full-
|
|
// screen DOS mode. Do not turn on the streams processor now
|
|
// if that's the case, instead wait until AssertMode switches
|
|
// us back to graphics mode:
|
|
|
|
}
|
|
|
|
// Note that we don't call 'vGetDisplayDuration' here, for a couple of
|
|
// reasons:
|
|
//
|
|
// o Because the system is already running, it would be disconcerting
|
|
// to pause the graphics for a good portion of a second just to read
|
|
// the refresh rate;
|
|
// o More importantly, we may not be in graphics mode right now.
|
|
//
|
|
// For both reasons, we always measure the refresh rate when we switch
|
|
// to a new mode.
|
|
|
|
return(TRUE);
|
|
}
|
|
|
|
/******************************************************************************\
|
|
*
|
|
* Function: DrvDisableDirectDraw
|
|
*
|
|
* Disable DirectDraw. This function is called when an application closes the
|
|
* DirectDraw connection.
|
|
*
|
|
* Parameters: dhpdev Handle to physical device.
|
|
*
|
|
* Returns: Nothing.
|
|
*
|
|
\******************************************************************************/
|
|
VOID DrvDisableDirectDraw(
|
|
DHPDEV dhpdev)
|
|
{
|
|
PDEV* ppdev;
|
|
OH* poh;
|
|
|
|
// DirectDraw is done with the display, so we can go back to using
|
|
// all of off-screen memory ourselves.
|
|
ppdev = (PPDEV) dhpdev;
|
|
poh = ppdev->pohDirectDraw;
|
|
|
|
if (poh)
|
|
{
|
|
DISPDBG((1, "Releasing DirectDraw surface %d x %d at (%d, %d)",
|
|
poh->cx, poh->cy, poh->x, poh->y));
|
|
}
|
|
|
|
pohFree(ppdev, poh);
|
|
ppdev->pohDirectDraw = NULL;
|
|
|
|
// Invalidate all cached fonts.
|
|
vAssertModeText(ppdev, TRUE);
|
|
}
|
|
|
|
/******************************************************************************\
|
|
*
|
|
* Function: vAssertModeDirectDraw
|
|
*
|
|
* Perform specific DirectDraw initialization when the screen switches focus
|
|
* (from graphics to full screen MS-DOS and vice versa).
|
|
*
|
|
* Parameters: ppdev Pointer to physical device.
|
|
* bEnabled True if the screen is in graphics mode.
|
|
*
|
|
* Returns: Nothing.
|
|
*
|
|
\******************************************************************************/
|
|
VOID vAssertModeDirectDraw(
|
|
PDEV* ppdev,
|
|
BOOL bEnabled)
|
|
{
|
|
}
|
|
|
|
/******************************************************************************\
|
|
*
|
|
* Function: bEnableDirectDraw
|
|
*
|
|
* Enable DirectDraw. Called from DrvEnableSurface.
|
|
*
|
|
* Parameters: ppdev Pointer to phsyical device.
|
|
*
|
|
* Returns: Nothing.
|
|
*
|
|
\******************************************************************************/
|
|
BOOL bEnableDirectDraw(
|
|
PDEV* ppdev)
|
|
{
|
|
|
|
if (DIRECT_ACCESS(ppdev) && // Direct access must be enabled.
|
|
#if (DIRECTX_24 < 1)
|
|
(ppdev->cBpp != 3) && // Turn off DirectDraw in 24-bpp.
|
|
#endif
|
|
(ppdev->flCaps & CAPS_ENGINEMANAGED) && // Only support CL-GD5436/5446.
|
|
(ppdev->flCaps & CAPS_MM_IO)) // Memory Mapped I/O must be on.
|
|
{
|
|
// We have to preserve the contents of the CR1B and CR1D registers on a
|
|
// page flip.
|
|
CP_OUT_BYTE(ppdev->pjPorts, CRTC_INDEX, 0x1B);
|
|
ppdev->ulCR1B = (CP_IN_BYTE(ppdev->pjPorts, CRTC_DATA) & 0xF2) << 8;
|
|
CP_OUT_BYTE(ppdev->pjPorts, CRTC_INDEX, 0x1D);
|
|
ppdev->ulCR1D = (CP_IN_BYTE(ppdev->pjPorts, CRTC_DATA) & 0x7F) << 8;
|
|
|
|
// Accurately measure the refresh rate for later.
|
|
vGetDisplayDuration(ppdev);
|
|
|
|
// DirectDraw is all set to be used on this card.
|
|
ppdev->flStatus |= STAT_DIRECTDRAW;
|
|
|
|
#if 1 // sge
|
|
EnableStartAddrDoubleBuffer(ppdev);
|
|
#endif // sge
|
|
}
|
|
|
|
return(TRUE);
|
|
}
|
|
|
|
/******************************************************************************\
|
|
*
|
|
* Function: vDisableDirectDraw
|
|
*
|
|
* Disbale DirectDraw. Called from DrvDisableSurface.
|
|
*
|
|
* Parameters: ppdev Pointer to physical device.
|
|
*
|
|
* Returns: Nothing.
|
|
*
|
|
\******************************************************************************/
|
|
VOID vDisableDirectDraw(
|
|
PDEV* ppdev)
|
|
{
|
|
}
|
|
|
|
#if 1 // OVERLAY #sge
|
|
/******************************************************************************\
|
|
*
|
|
* Function: GetFormatInfo
|
|
*
|
|
* Get DirectDraw information,
|
|
*
|
|
* Parameters: ppdev Pointer to physical device.
|
|
*
|
|
* Returns: Nothing.
|
|
*
|
|
\******************************************************************************/
|
|
VOID GetFormatInfo(PDEV* ppdev, LPDDPIXELFORMAT lpFormat, LPDWORD lpFourcc,
|
|
LPWORD lpBitCount)
|
|
{
|
|
|
|
if (lpFormat->dwFlags & DDPF_FOURCC)
|
|
{
|
|
*lpFourcc = lpFormat->dwFourCC;
|
|
if (lpFormat->dwFourCC == BI_RGB)
|
|
{
|
|
*lpBitCount = (WORD) lpFormat->dwRGBBitCount;
|
|
#ifdef DEBUG
|
|
if (lpFormat->dwRGBBitCount == 8)
|
|
{
|
|
DISPDBG((1, "Format: RGB 8"));
|
|
}
|
|
else if (lpFormat->dwRGBBitCount == 16)
|
|
{
|
|
DISPDBG ((1,"Format: RGB 5:5:5"));
|
|
}
|
|
#endif
|
|
}
|
|
else if (lpFormat->dwFourCC == BI_BITFIELDS)
|
|
{
|
|
if ((lpFormat->dwRGBBitCount != 16) ||
|
|
(lpFormat->dwRBitMask != 0xf800) ||
|
|
(lpFormat->dwGBitMask != 0x07e0) ||
|
|
(lpFormat->dwBBitMask != 0x001f))
|
|
{
|
|
*lpFourcc = (DWORD) -1;
|
|
}
|
|
else
|
|
{
|
|
*lpBitCount = 16;
|
|
DISPDBG((1,"Format: RGB 5:6:5"));
|
|
}
|
|
}
|
|
else
|
|
{
|
|
lpFormat->dwRBitMask = (DWORD) -1;
|
|
lpFormat->dwGBitMask = (DWORD) -1;
|
|
lpFormat->dwBBitMask = (DWORD) -1;
|
|
if (lpFormat->dwFourCC == FOURCC_PACKJR)
|
|
{
|
|
*lpBitCount = 8;
|
|
DISPDBG((1, "Format: CLJR"));
|
|
}
|
|
else if (lpFormat->dwFourCC == FOURCC_YUY2)
|
|
{
|
|
*lpBitCount = 16;
|
|
DISPDBG((1,"Format: YUY2"));
|
|
}
|
|
else
|
|
{
|
|
*lpBitCount = 16;
|
|
DISPDBG((1,"Format: UYVY"));
|
|
}
|
|
}
|
|
}
|
|
else if (lpFormat->dwFlags & DDPF_RGB)
|
|
{
|
|
if (lpFormat->dwRGBBitCount == 8)
|
|
{
|
|
*lpFourcc = BI_RGB;
|
|
DISPDBG((1, "Format: RGB 8"));
|
|
}
|
|
else if ((lpFormat->dwRGBBitCount == 16) &&
|
|
(lpFormat->dwRBitMask == 0xf800) &&
|
|
(lpFormat->dwGBitMask == 0x07e0) &&
|
|
(lpFormat->dwBBitMask == 0x001f))
|
|
{
|
|
*lpFourcc = BI_BITFIELDS;
|
|
DISPDBG((1,"Format: RGB 5:6:5"));
|
|
}
|
|
else if ((lpFormat->dwRGBBitCount == 16) &&
|
|
(lpFormat->dwRBitMask == 0x7C00) &&
|
|
(lpFormat->dwGBitMask == 0x03e0) &&
|
|
(lpFormat->dwBBitMask == 0x001f))
|
|
{
|
|
*lpFourcc = BI_RGB;
|
|
DISPDBG((1,"Format: RGB 5:5:5"));
|
|
}
|
|
else if (((lpFormat->dwRGBBitCount == 24) ||
|
|
(lpFormat->dwRGBBitCount == 32)) &&
|
|
(lpFormat->dwRBitMask == 0xff0000) &&
|
|
(lpFormat->dwGBitMask == 0x00ff00) &&
|
|
(lpFormat->dwBBitMask == 0x0000ff))
|
|
{
|
|
*lpFourcc = BI_RGB;
|
|
DISPDBG((1, "Format: RGB 8:8:8"));
|
|
}
|
|
else
|
|
{
|
|
*lpFourcc = (DWORD) -1;
|
|
}
|
|
*lpBitCount = (WORD) lpFormat->dwRGBBitCount;
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 16)
|
|
{
|
|
*lpFourcc = BI_RGB;
|
|
*lpBitCount = (WORD) lpFormat->dwRGBBitCount;
|
|
}
|
|
else
|
|
{
|
|
*lpFourcc = (DWORD) -1;
|
|
}
|
|
}
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: RegInitVideo
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* This function is called to program the video format and
|
|
* the physicall offset of the video data in the frame buffer.
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* none
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 09/24/96
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
|
|
VOID RegInitVideo(PDEV* ppdev, PDD_SURFACE_LOCAL lpSurface)
|
|
{
|
|
DWORD dwTemp;
|
|
DWORD dwFourcc;
|
|
LONG lPitch;
|
|
LONG lLeft;
|
|
WORD wTemp;
|
|
WORD wBitCount = 0;
|
|
RECTL rVideoRect;
|
|
BYTE bRegCR31;
|
|
BYTE bRegCR32;
|
|
BYTE bRegCR33;
|
|
BYTE bRegCR34;
|
|
BYTE bRegCR35;
|
|
BYTE bRegCR36;
|
|
BYTE bRegCR37;
|
|
BYTE bRegCR38;
|
|
BYTE bRegCR39;
|
|
BYTE bRegCR3A;
|
|
BYTE bRegCR3B;
|
|
BYTE bRegCR3C;
|
|
BYTE bRegCR3D;
|
|
BYTE bRegCR3E;
|
|
BYTE bRegCR5C;
|
|
BYTE bRegCR5D;
|
|
BYTE bTemp;
|
|
DWORD dwTemp1;
|
|
BOOL bOverlayTooSmall = FALSE;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
|
|
/*
|
|
* Determine the format of the video data
|
|
*/
|
|
if (lpSurface->dwFlags & DDRAWISURF_HASPIXELFORMAT)
|
|
{
|
|
GetFormatInfo(ppdev, &(lpSurface->lpGbl->ddpfSurface),
|
|
&dwFourcc, &wBitCount);
|
|
}
|
|
else
|
|
{
|
|
// This needs to be changed when primary surface is RGB 5:6:5
|
|
dwFourcc = BI_RGB;
|
|
wBitCount = (WORD) ppdev->cBitsPerPixel;
|
|
}
|
|
|
|
rVideoRect = ppdev->rOverlayDest;
|
|
lPitch = lpSurface->lpGbl->lPitch;
|
|
|
|
/*
|
|
* Determine value in CR31 (Horizontal Zoom Code)
|
|
*/
|
|
if ((ppdev->rOverlayDest.right - ppdev->rOverlayDest.left) ==
|
|
(ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left))
|
|
{
|
|
/*
|
|
* No zooming is occuring
|
|
*/
|
|
bRegCR31 = 0;
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* The zoom code = (256 * <src width>) / <dest width>
|
|
*/
|
|
dwTemp = (DWORD) ((DWORD) (ppdev->rOverlaySrc.right
|
|
- ppdev->rOverlaySrc.left)) * 256;
|
|
if (ppdev->bDoubleClock)
|
|
{
|
|
dwTemp <<= 1;
|
|
}
|
|
dwTemp1= (DWORD) (ppdev->rOverlayDest.right - ppdev->rOverlayDest.left);
|
|
dwTemp= ((2 * dwTemp) + dwTemp1) / (2*dwTemp1);
|
|
bRegCR31= (BYTE) dwTemp;
|
|
}
|
|
|
|
/*
|
|
* Determine value in CR32 (Vertical Zoom Code)
|
|
*/
|
|
if ((ppdev->rOverlayDest.bottom - ppdev->rOverlayDest.top) ==
|
|
(ppdev->rOverlaySrc.bottom - ppdev->rOverlaySrc.top))
|
|
{
|
|
/*
|
|
* No zooming is occuring
|
|
*/
|
|
bRegCR32 = 0;
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* The zoom code = (256 * <src height>) / <dest height>
|
|
* The -1 is so that it won't mangle the last line by mixing it
|
|
* with garbage data while Y interpolating.
|
|
*/
|
|
dwTemp = (DWORD) ((DWORD) ((ppdev->rOverlaySrc.bottom - 1)
|
|
- ppdev->rOverlaySrc.top)) * 256;
|
|
dwTemp /= (DWORD) (ppdev->rOverlayDest.bottom - ppdev->rOverlayDest.top);
|
|
bRegCR32 = (BYTE) dwTemp;
|
|
}
|
|
|
|
/*
|
|
* Determine value in CR33 (Region 1 Size)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.left;
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
wTemp >>= 2; // 4 Pixels per DWORD
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 16)
|
|
{
|
|
wTemp >>= 1; // 2 Pixels per DWORD
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 24)
|
|
{
|
|
wTemp *= 3;
|
|
wTemp /= 4;
|
|
}
|
|
bRegCR33 = (BYTE) wTemp;
|
|
bRegCR36 = (BYTE) (WORD) (wTemp >> 8);
|
|
|
|
/*
|
|
* Determine value in CR34 (Region 2 size)
|
|
*/
|
|
wTemp = (WORD) (rVideoRect.right - rVideoRect.left);
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
wTemp >>= 2; // 4 Pixels per DWORD
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 16)
|
|
{
|
|
wTemp >>= 1; // 2 Pixels per DWORD
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 24)
|
|
{
|
|
wTemp *= 3;
|
|
wTemp /= 4;
|
|
}
|
|
bRegCR34 = (BYTE) wTemp;
|
|
wTemp >>= 6;
|
|
bRegCR36 |= (BYTE) (wTemp & 0x0C);
|
|
|
|
/*
|
|
* Determine value in CR35 (Region 2 SDSize)
|
|
*/
|
|
dwTemp = (DWORD) (rVideoRect.right - rVideoRect.left);
|
|
dwTemp *= (DWORD) (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left);
|
|
dwTemp /= (DWORD) (ppdev->rOverlayDest.right - ppdev->rOverlayDest.left);
|
|
wTemp = (WORD) dwTemp;
|
|
if ((dwFourcc == FOURCC_PACKJR) || (wBitCount == 8))
|
|
{
|
|
wTemp >>= 2; // 4 Pixels per DWORD
|
|
}
|
|
else
|
|
{
|
|
wTemp >>= 1; // 2 Pixels per DWORD
|
|
}
|
|
bRegCR35 = (BYTE) wTemp;
|
|
wTemp >>= 4;
|
|
bRegCR36 |= (BYTE) (wTemp & 0x30);
|
|
|
|
//
|
|
// Check double scan line counter feature
|
|
//
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x17);
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
if (bTemp & 0x04)
|
|
{
|
|
//
|
|
// Double scan line count
|
|
//
|
|
/*
|
|
* Determine value in CR37 (Vertical Start)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.top;
|
|
bRegCR37 = (BYTE)(wTemp >> 1);
|
|
if ( wTemp & 0x01 )
|
|
{
|
|
wTemp >>= 9;
|
|
bRegCR39 = (BYTE) wTemp | 0x10;
|
|
//
|
|
// Odd scan line trigger
|
|
// Hardware has a bug now.
|
|
// So reduce dest end by 1
|
|
//
|
|
wTemp = (WORD) rVideoRect.bottom - 1 - 1;
|
|
}
|
|
else
|
|
{
|
|
wTemp >>= 9;
|
|
bRegCR39 = (BYTE) wTemp;
|
|
/*
|
|
* Determine value in CR38 (Vertical End)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.bottom - 1;
|
|
}
|
|
bRegCR38 = (BYTE)(wTemp >> 1);
|
|
if (wTemp & 0x01)
|
|
bRegCR39 |= 0x20;
|
|
wTemp >>= 7;
|
|
bRegCR39 |= (BYTE) (wTemp & 0x0C);
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* Determine value in CR37 (Vertical Start)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.top;
|
|
bRegCR37 = (BYTE) wTemp;
|
|
wTemp >>= 8;
|
|
bRegCR39 = (BYTE) wTemp;
|
|
|
|
/*
|
|
* Determine value in CR38 (Vertical End)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.bottom - 1;
|
|
bRegCR38 = (BYTE) wTemp;
|
|
wTemp >>= 6;
|
|
bRegCR39 |= (BYTE) (wTemp & 0x0C);
|
|
}
|
|
/*
|
|
* Determine values in CR3A, CR3B, CR3C (Start Address)
|
|
*/
|
|
dwTemp = 0;
|
|
|
|
|
|
if (bRegCR31 != 0)
|
|
{
|
|
//
|
|
// overlay is zoomed, re-initialize zoom factor
|
|
//
|
|
CalculateStretchCode(ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left,
|
|
ppdev->rOverlayDest.right - ppdev->rOverlayDest.left, ppdev->HorStretchCode);
|
|
}
|
|
|
|
//
|
|
// Here, we want to ensure the source rectangle's clipped width is bigger
|
|
// than what the HW can support, sigh!
|
|
//
|
|
if (!bOverlayTooSmall)
|
|
{
|
|
LONG lSrcPels;
|
|
|
|
//
|
|
// compute non-clip amount on right edge
|
|
//
|
|
lSrcPels = rVideoRect.right - rVideoRect.left;
|
|
|
|
if (bRegCR31 != 0) // source is zoomed if non-zero
|
|
{
|
|
WORD wRightCnt;
|
|
|
|
wRightCnt = 0;
|
|
while (lSrcPels > 0)
|
|
{
|
|
lSrcPels -= ppdev->HorStretchCode[wRightCnt];
|
|
if (lSrcPels >= 0)
|
|
{
|
|
wRightCnt++;
|
|
}
|
|
}
|
|
lSrcPels = (LONG)wRightCnt;
|
|
}
|
|
|
|
if ((lSrcPels == 0) || (lSrcPels <= MIN_OLAY_WIDTH))
|
|
{
|
|
bOverlayTooSmall = TRUE;
|
|
}
|
|
}
|
|
|
|
lLeft = ppdev->rOverlaySrc.left;
|
|
if (dwFourcc == FOURCC_PACKJR)
|
|
{
|
|
lLeft &= ~0x03;
|
|
}
|
|
else if (dwFourcc == FOURCC_YUV422 || dwFourcc == FOURCC_YUY2 )
|
|
{
|
|
lLeft &= ~0x01;
|
|
}
|
|
|
|
//
|
|
// dwTemp has adjusted dest. rect., add in source adjustment
|
|
//
|
|
dwTemp += (ppdev->rOverlaySrc.top * lPitch) + ((lLeft * wBitCount) >>3);
|
|
|
|
ppdev->sOverlay1.lAdjustSource = dwTemp;
|
|
// dwTemp += ((BYTE*)lpSurface->lpGbl->fpVidMem - ppdev->pjScreen); // sss
|
|
dwTemp += (DWORD)(lpSurface->lpGbl->fpVidMem);
|
|
|
|
bRegCR5D = (BYTE) ((dwTemp << 2) & 0x0C);
|
|
dwTemp >>= 2;
|
|
bRegCR3A = (BYTE) dwTemp & 0xfe; // Align to even byte (5446 bug)
|
|
dwTemp >>= 8;
|
|
bRegCR3B = (BYTE) dwTemp;
|
|
dwTemp >>= 8;
|
|
bRegCR3C = (BYTE) (dwTemp & 0x0f);
|
|
|
|
/*
|
|
* Determine value in CR3D (Address Offset/Pitch)
|
|
*/
|
|
wTemp = (WORD) (lPitch >> 3);
|
|
if (lpSurface->dwReserved1 & OVERLAY_FLG_DECIMATE)
|
|
{
|
|
wTemp >>= 1;
|
|
}
|
|
bRegCR3D = (BYTE) wTemp;
|
|
wTemp >>= 3;
|
|
bRegCR3C |= (BYTE) (wTemp & 0x20);
|
|
|
|
/*
|
|
* Determine value in CR3E (Master Control Register)
|
|
*/
|
|
bRegCR3E = 0;
|
|
if (lpSurface->dwReserved1 & OVERLAY_FLG_ENABLED)
|
|
{
|
|
bRegCR3E = 0x01;
|
|
}
|
|
if (dwFourcc == FOURCC_PACKJR)
|
|
{
|
|
bRegCR3E |= 0x20; // Always error difuse when using PackJR
|
|
}
|
|
if ((bRegCR32 == 0) || MustLineReplicate (ppdev, lpSurface, wBitCount))
|
|
{
|
|
bRegCR3E |= 0x10;
|
|
lpSurface->dwReserved1 &= ~OVERLAY_FLG_INTERPOLATE;
|
|
}
|
|
else
|
|
{
|
|
lpSurface->dwReserved1 |= OVERLAY_FLG_INTERPOLATE;
|
|
}
|
|
if (dwFourcc == FOURCC_PACKJR)
|
|
{
|
|
bRegCR3E |= 0x02;
|
|
}
|
|
else if (dwFourcc == BI_RGB)
|
|
{
|
|
if (wBitCount == 16)
|
|
{
|
|
bRegCR3E |= 0x08;
|
|
}
|
|
else if (wBitCount == 8)
|
|
{
|
|
bRegCR3E |= 0x04;
|
|
}
|
|
}
|
|
else if (dwFourcc == BI_BITFIELDS)
|
|
{
|
|
bRegCR3E |= 0x0A;
|
|
}
|
|
|
|
/*
|
|
* If we are color keying, we will set that up now
|
|
*/
|
|
if (lpSurface->dwReserved1 & OVERLAY_FLG_COLOR_KEY)
|
|
{
|
|
bRegCR3E |= 0x80;
|
|
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a);
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Set CR1A[3:2] to timing ANDed w/ color
|
|
bTemp &= ~0x0C;
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp);
|
|
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1d); // Clear CR1D[5:4]
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x38);
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, (ppdev->wColorKey << 8) | 0x0c); // Output color to GRC
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, 0x0d); // Output color to GRD
|
|
}
|
|
else
|
|
{
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, (bTemp & ~0x30) | 0x08);
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, (ppdev->wColorKey << 8) | 0x0c); // Output color to GRC
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, (ppdev->wColorKey & 0xff00) | 0x0d);// Output color to GRD
|
|
}
|
|
}
|
|
else if (lpSurface->dwReserved1 & OVERLAY_FLG_SRC_COLOR_KEY)
|
|
{
|
|
BYTE bYMax, bYMin, bUMax, bUMin, bVMax, bVMin;
|
|
|
|
bRegCR3E |= 0x80;
|
|
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a);
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Set CR1A[3:2] to timing ANDed w/ color
|
|
bTemp &= ~0x0C;
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp);
|
|
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1d); // Set CR1D[5:4] to 10
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, CP_IN_BYTE(pjPorts, CRTC_DATA) | 0x20);
|
|
|
|
/*
|
|
* Determine min/max values
|
|
*/
|
|
if ((dwFourcc == FOURCC_YUV422) ||
|
|
(dwFourcc == FOURCC_YUY2) ||
|
|
(dwFourcc == FOURCC_PACKJR))
|
|
{
|
|
bYMax = (BYTE)(DWORD)(ppdev->dwSrcColorKeyHigh >> 16);
|
|
bYMin = (BYTE)(DWORD)(ppdev->dwSrcColorKeyLow >> 16);
|
|
bUMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 8) & 0xff);
|
|
bUMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 8) & 0xff);
|
|
bVMax = (BYTE)(ppdev->dwSrcColorKeyHigh & 0xff);
|
|
bVMin = (BYTE)(ppdev->dwSrcColorKeyLow & 0xff);
|
|
if (dwFourcc == FOURCC_PACKJR)
|
|
{
|
|
bYMax |= 0x07;
|
|
bUMax |= 0x03;
|
|
bVMax |= 0x03;
|
|
bYMin &= ~0x07;
|
|
bUMin &= ~0x03;
|
|
bVMin &= ~0x03;
|
|
}
|
|
}
|
|
else if ((dwFourcc == 0) && (wBitCount == 16))
|
|
{
|
|
/*
|
|
* RGB 5:5:5
|
|
*/
|
|
bYMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 7) & 0xF8);
|
|
bYMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 7) & 0xF8);
|
|
bUMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 2) & 0xF8);
|
|
bUMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 2) & 0xF8);
|
|
bVMax = (BYTE)(ppdev->dwSrcColorKeyHigh << 3);
|
|
bVMin = (BYTE)(ppdev->dwSrcColorKeyLow << 3);
|
|
bYMax |= 0x07;
|
|
bUMax |= 0x07;
|
|
bVMax |= 0x07;
|
|
|
|
}
|
|
else if (dwFourcc == BI_BITFIELDS)
|
|
{
|
|
/*
|
|
* RGB 5:6:5
|
|
*/
|
|
bYMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 8) & 0xF8);
|
|
bYMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 8) & 0xF8);
|
|
bUMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 3) & 0xFC);
|
|
bUMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 3) & 0xFC);
|
|
bVMax = (BYTE)(ppdev->dwSrcColorKeyHigh << 3);
|
|
bVMin = (BYTE)(ppdev->dwSrcColorKeyLow << 3);
|
|
bYMax |= 0x07;
|
|
bUMax |= 0x03;
|
|
bVMax |= 0x07;
|
|
}
|
|
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bYMin << 8) | 0x0C); // GRC
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bYMax << 8) | 0x0D); // GRD
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bUMin << 8) | 0x1C); // GR1C
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bUMax << 8) | 0x1D); // GR1D
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bVMin << 8) | 0x1E); // GR1E
|
|
CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bVMax << 8) | 0x1F); // GR1F
|
|
}
|
|
else
|
|
{
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a);
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Clear CR1A[3:2]
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x0C);
|
|
}
|
|
|
|
/*
|
|
* Set up alignment info
|
|
*/
|
|
if (ppdev->cBitsPerPixel != 24)
|
|
{
|
|
WORD wXAlign;
|
|
WORD wXSize;
|
|
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
wXAlign = (WORD)rVideoRect.left & 0x03;
|
|
wXSize = (WORD)(rVideoRect.right - rVideoRect.left) & 0x03;
|
|
}
|
|
else
|
|
{
|
|
wXAlign = (WORD)(rVideoRect.left & 0x01) << 1;
|
|
wXSize = (WORD)((rVideoRect.right - rVideoRect.left) & 0x01) << 1;
|
|
}
|
|
bRegCR5D |= (BYTE) (wXAlign | (wXSize << 4));
|
|
}
|
|
else
|
|
{
|
|
bRegCR5D = 0;
|
|
}
|
|
|
|
/*
|
|
* Set up the FIFO threshold value. Make sure that the value we use is
|
|
* not less than the default value.
|
|
*/
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, 0x16);
|
|
bTemp = CP_IN_BYTE(pjPorts, SR_DATA) & 0x0f;
|
|
if (bTemp > (ppdev->lFifoThresh & 0x0f))
|
|
{
|
|
ppdev->lFifoThresh = bTemp;
|
|
}
|
|
if (ppdev->lFifoThresh < 0x0f)
|
|
{
|
|
ppdev->lFifoThresh++; // Eliminates possible errata
|
|
}
|
|
bRegCR5C = 0x10 | ((BYTE) ppdev->lFifoThresh & 0x0f);
|
|
|
|
|
|
/*
|
|
* Now start programming the registers
|
|
*/
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR31 << 8) | 0x31); // CR31
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR32 << 8) | 0x32); // CR32
|
|
if (lpSurface->dwReserved1 & OVERLAY_FLG_YUVPLANAR)
|
|
{
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) 0x10 << 8) | 0x3F); // CR3F
|
|
}
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR5C << 8) | 0x5C); // CR5C
|
|
|
|
//
|
|
// disable overlay if overlay is too small to be supported by HW
|
|
//
|
|
if (bOverlayTooSmall)
|
|
{
|
|
bRegCR3E &= ~0x01; // disable overlay
|
|
ppdev->dwPanningFlag |= OVERLAY_OLAY_REENABLE; // totally clipped
|
|
}
|
|
else
|
|
{
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR33 << 8) | 0x33); // CR33
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR34 << 8) | 0x34); // CR34
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR35 << 8) | 0x35); // CR35
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR36 << 8) | 0x36); // CR36
|
|
// CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR37 << 8) | 0x37); // CR37
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR38 << 8) | 0x38); // CR38
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR39 << 8) | 0x39); // CR39
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3A << 8) | 0x3A); // CR3A
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3B << 8) | 0x3B); // CR3B
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3C << 8) | 0x3C); // CR3C
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3D << 8) | 0x3D); // CR3D
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR5D << 8) | 0x5D); // CR5D
|
|
//
|
|
// Write Vertical start first
|
|
//
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR37 << 8) | 0x37); // CR37
|
|
}
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3E << 8) | 0x3E); // CR3E
|
|
}
|
|
|
|
|
|
/**********************************************************
|
|
* Name: DisableOverlay_544x
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* This is called when an overlay window is totally clipped by
|
|
* the panning viewport.
|
|
**********************************************************/
|
|
VOID DisableOverlay_544x(PDEV* ppdev)
|
|
{
|
|
WORD wCR3E;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
ppdev->dwPanningFlag |= OVERLAY_OLAY_REENABLE;
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX,0x3e); //Video Window Master Control
|
|
wCR3E = CP_IN_WORD(pjPorts, CRTC_INDEX) & ~0x100; //clear bit one
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, wCR3E); //disable overlay window
|
|
}
|
|
|
|
|
|
/**********************************************************
|
|
* Name: EnableOverlay_544x
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* Show the overlay window.
|
|
**********************************************************/
|
|
VOID EnableOverlay_544x(PDEV* ppdev)
|
|
{
|
|
WORD wCR3E;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
ppdev->dwPanningFlag &= ~OVERLAY_OLAY_REENABLE;
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX,0x3e); //Video Window Master Control
|
|
wCR3E = CP_IN_WORD(pjPorts, CRTC_INDEX) | 0x100; //clear bit one
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, wCR3E); //disable overlay window
|
|
}
|
|
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: ClearAltFIFOThreshold_544x
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
*
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* none
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 02/03/97
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
VOID ClearAltFIFOThreshold_544x(PDEV * ppdev)
|
|
{
|
|
UCHAR bTemp;
|
|
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
DISPDBG((1, "ClearAltFIFOThreshold"));
|
|
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x5c); // Clear Alt FIFO Threshold
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x10);
|
|
}
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: RegMoveVideo
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* This function is called to move the video window that has
|
|
* already been programed.
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* none
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 09/25/96
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
|
|
VOID RegMoveVideo(PDEV* ppdev, PDD_SURFACE_LOCAL lpSurface)
|
|
{
|
|
BOOL bZoomX;
|
|
DWORD dwTemp;
|
|
DWORD dwFourcc;
|
|
LONG lLeft;
|
|
LONG lPitch;
|
|
WORD wTemp;
|
|
WORD wBitCount = 0;
|
|
RECTL rVideoRect;
|
|
BYTE bRegCR33;
|
|
BYTE bRegCR34;
|
|
BYTE bRegCR35;
|
|
BYTE bRegCR36;
|
|
BYTE bRegCR37;
|
|
BYTE bRegCR38;
|
|
BYTE bRegCR39;
|
|
BYTE bRegCR3A;
|
|
BYTE bRegCR3B;
|
|
BYTE bRegCR3C;
|
|
BYTE bRegCR3D;
|
|
BYTE bRegCR5D;
|
|
BYTE bTemp;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
/*
|
|
* Determine the format of the video data
|
|
*/
|
|
if (lpSurface->dwFlags & DDRAWISURF_HASPIXELFORMAT)
|
|
{
|
|
GetFormatInfo(ppdev, &(lpSurface->lpGbl->ddpfSurface),
|
|
&dwFourcc, &wBitCount);
|
|
}
|
|
else
|
|
{
|
|
// This needs to be changed when primary surface is RGB 5:6:5
|
|
dwFourcc = BI_RGB;
|
|
wBitCount = (WORD) ppdev->cBitsPerPixel;
|
|
}
|
|
|
|
rVideoRect = ppdev->rOverlayDest;
|
|
//
|
|
// rVideoRect is now adjusted and clipped to the panning viewport.
|
|
// Disable overlay if totally clipped by viewport.
|
|
//
|
|
if (((rVideoRect.right - rVideoRect.left) <= 0) ||
|
|
((rVideoRect.bottom- rVideoRect.top ) <= 0))
|
|
{
|
|
DisableOverlay_544x(ppdev); // #ew1 cannot display below min. overlay size
|
|
return;
|
|
}
|
|
|
|
lPitch = lpSurface->lpGbl->lPitch;
|
|
|
|
/*
|
|
* Determine value in CR33 (Region 1 Size)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.left;
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
wTemp >>= 2; // 4 Pixels per DWORD
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 16)
|
|
{
|
|
wTemp >>= 1; // 2 Pixels per DWORD
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 24)
|
|
{
|
|
wTemp *= 3;
|
|
wTemp /= 4;
|
|
}
|
|
bRegCR33 = (BYTE) wTemp;
|
|
bRegCR36 = (BYTE) (WORD) (wTemp >> 8);
|
|
|
|
/*
|
|
* Determine value in CR34 (Region 2 size)
|
|
*/
|
|
wTemp = (WORD) (rVideoRect.right - rVideoRect.left);
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
wTemp >>= 2; // 4 Pixels per DWORD
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 16)
|
|
{
|
|
wTemp >>= 1; // 2 Pixels per DWORD
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 24)
|
|
{
|
|
wTemp *= 3;
|
|
wTemp /= 4;
|
|
}
|
|
bRegCR34 = (BYTE) wTemp;
|
|
wTemp >>= 6;
|
|
bRegCR36 |= (BYTE) (wTemp & 0x0C);
|
|
|
|
/*
|
|
* Determine value in CR35 (Region 2SD Size)
|
|
*/
|
|
dwTemp = (DWORD) (rVideoRect.right - rVideoRect.left);
|
|
dwTemp *= (DWORD) (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left);
|
|
dwTemp /= (DWORD) (ppdev->rOverlayDest.right - ppdev->rOverlayDest.left);
|
|
wTemp = (WORD) dwTemp;
|
|
if ((dwFourcc == FOURCC_PACKJR) || (wBitCount == 8))
|
|
{
|
|
wTemp >>= 2; // 4 Pixels per DWORD
|
|
}
|
|
else
|
|
{
|
|
wTemp >>= 1; // 2 Pixels per DWORD
|
|
}
|
|
bRegCR35 = (BYTE) wTemp;
|
|
wTemp >>= 4;
|
|
bRegCR36 |= (BYTE) (wTemp & 0x30);
|
|
|
|
//
|
|
// Check double scan line counter feature
|
|
//
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x17);
|
|
bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
if (bTemp & 0x04)
|
|
{
|
|
//
|
|
// Double scan line count
|
|
//
|
|
/*
|
|
* Determine value in CR37 (Vertical Start)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.top;
|
|
bRegCR37 = (BYTE)(wTemp >> 1);
|
|
if ( wTemp & 0x01 )
|
|
{
|
|
wTemp >>= 9;
|
|
bRegCR39 = (BYTE) wTemp | 0x10;
|
|
//
|
|
// Odd scan line trigger
|
|
// Hardware has a bug now.
|
|
// So reduce dest end by 1
|
|
//
|
|
wTemp = (WORD) rVideoRect.bottom - 1 - 1;
|
|
}
|
|
else
|
|
{
|
|
wTemp >>= 9;
|
|
bRegCR39 = (BYTE) wTemp;
|
|
/*
|
|
* Determine value in CR38 (Vertical End)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.bottom - 1;
|
|
}
|
|
bRegCR38 = (BYTE)(wTemp >> 1);
|
|
if (wTemp & 0x01)
|
|
bRegCR39 |= 0x20;
|
|
wTemp >>= 7;
|
|
bRegCR39 |= (BYTE) (wTemp & 0x0C);
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* Determine value in CR37 (Vertical Start)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.top;
|
|
//if (ppdev->bDoubleClock)
|
|
//{
|
|
// wTemp >>= 1;
|
|
//}
|
|
bRegCR37 = (BYTE) wTemp;
|
|
wTemp >>= 8;
|
|
bRegCR39 = (BYTE) wTemp;
|
|
|
|
/*
|
|
* Determine value in CR38 (Vertical End)
|
|
*/
|
|
wTemp = (WORD) rVideoRect.bottom - 1;
|
|
//if (ppdev->bDoubleClock)
|
|
//{
|
|
// wTemp >>= 1;
|
|
//}
|
|
bRegCR38 = (BYTE) wTemp;
|
|
wTemp >>= 6;
|
|
bRegCR39 |= (BYTE) (wTemp & 0x0C);
|
|
}
|
|
|
|
|
|
/*
|
|
* Determine values in CR3A, CR3B, CR3C (Start Address)
|
|
*/
|
|
dwTemp = 0;
|
|
|
|
|
|
bZoomX = ((ppdev->rOverlayDest.right - ppdev->rOverlayDest.left) !=
|
|
(ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left));
|
|
|
|
if (bZoomX)
|
|
{
|
|
//
|
|
// overlay is zoomed, re-initialize zoom factor
|
|
//
|
|
CalculateStretchCode(ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left,
|
|
ppdev->rOverlayDest.right - ppdev->rOverlayDest.left, ppdev->HorStretchCode);
|
|
}
|
|
|
|
|
|
//
|
|
// Here, we want to ensure the source rectangle's clipped width is bigger
|
|
// than what the HW can support, sigh!
|
|
//
|
|
// if (grOverlayDest.right > sData->rViewport.right)
|
|
{
|
|
int iSrcPels;
|
|
|
|
//
|
|
// compute non-clip amount on right edge
|
|
//
|
|
iSrcPels = (int)(rVideoRect.right - rVideoRect.left);
|
|
|
|
if (bZoomX)
|
|
{
|
|
WORD wRightCnt;
|
|
|
|
wRightCnt = 0;
|
|
while (iSrcPels > 0)
|
|
{
|
|
iSrcPels -= ppdev->HorStretchCode[wRightCnt];
|
|
if (iSrcPels >= 0)
|
|
{
|
|
wRightCnt++;
|
|
}
|
|
}
|
|
iSrcPels = (int)wRightCnt;
|
|
}
|
|
|
|
if ((iSrcPels == 0) || (iSrcPels <= MIN_OLAY_WIDTH))
|
|
{
|
|
DisableOverlay_544x(ppdev); // cannot display below min. overlay size
|
|
return;
|
|
}
|
|
}
|
|
|
|
|
|
lLeft = ppdev->rOverlaySrc.left;
|
|
if (dwFourcc == FOURCC_PACKJR)
|
|
{
|
|
lLeft &= ~0x03;
|
|
}
|
|
else if (dwFourcc == FOURCC_YUV422 || dwFourcc == FOURCC_YUY2)
|
|
{
|
|
lLeft &= ~0x01;
|
|
}
|
|
|
|
//
|
|
// #ew1 dwTemp has adjusted dest. rect., add in source adjustment
|
|
//
|
|
dwTemp += (ppdev->rOverlaySrc.top * lPitch) + ((lLeft * wBitCount) >>3);
|
|
|
|
ppdev->sOverlay1.lAdjustSource = dwTemp;
|
|
|
|
// dwTemp += ((BYTE*)lpSurface->lpGbl->fpVidMem - ppdev->pjScreen); // sss
|
|
dwTemp += (DWORD)(lpSurface->lpGbl->fpVidMem);
|
|
|
|
bRegCR5D = (BYTE) ((dwTemp << 2) & 0x0C);
|
|
dwTemp >>= 2;
|
|
bRegCR3A = (BYTE) dwTemp & 0xfe; // Align to even byte (5446 bug)
|
|
dwTemp >>= 8;
|
|
bRegCR3B = (BYTE) dwTemp;
|
|
dwTemp >>= 8;
|
|
bRegCR3C = (BYTE) (dwTemp & 0x0f);
|
|
|
|
/*
|
|
* Determine value in CR3D (Address Offset/Pitch)
|
|
*/
|
|
wTemp = (WORD) (lPitch >> 3);
|
|
if (lpSurface->dwReserved1 & OVERLAY_FLG_DECIMATE)
|
|
{
|
|
wTemp >>= 1;
|
|
}
|
|
bRegCR3D = (BYTE) wTemp;
|
|
wTemp >>= 3;
|
|
bRegCR3C |= (BYTE) (wTemp & 0x20);
|
|
|
|
/*
|
|
* Set up alignment info
|
|
*/
|
|
if (ppdev->cBitsPerPixel != 24)
|
|
{
|
|
WORD wXAlign;
|
|
WORD wXSize;
|
|
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
wXAlign = (WORD)rVideoRect.left & 0x03;
|
|
wXSize = (WORD)(rVideoRect.right - rVideoRect.left) & 0x03;
|
|
}
|
|
else
|
|
{
|
|
wXAlign = (WORD)(rVideoRect.left & 0x01) << 1;
|
|
wXSize = (WORD)((rVideoRect.right - rVideoRect.left) & 0x01) << 1;
|
|
}
|
|
bRegCR5D |= (BYTE) (wXAlign | (wXSize << 4));
|
|
}
|
|
|
|
/*
|
|
* Now we will write the actual register values.
|
|
*/
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR33 << 8) | 0x33); // CR33
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR34 << 8) | 0x34); // CR34
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR35 << 8) | 0x35); // CR35
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR36 << 8) | 0x36); // CR36
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR38 << 8) | 0x38); // CR38
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR39 << 8) | 0x39); // CR39
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3A << 8) | 0x3A); // CR3A
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3B << 8) | 0x3B); // CR3B
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3C << 8) | 0x3C); // CR3C
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3D << 8) | 0x3D); // CR3D
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR5D << 8) | 0x5D); // CR5D
|
|
CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR37 << 8) | 0x37); // CR37
|
|
|
|
if (ppdev->dwPanningFlag & OVERLAY_OLAY_REENABLE)
|
|
EnableOverlay_544x(ppdev);
|
|
}
|
|
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: CalculateStretchCode
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* This code was originally written by Intel and distributed
|
|
* with the DCI development kit.
|
|
*
|
|
* This function takes the zoom factor and determines exactly
|
|
* how many times we need to replicate each row/column.
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* none
|
|
*
|
|
***********************************************************
|
|
* Author: Intel
|
|
* Date: ??/??/??
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
* Scott MacDonald 10/06/94 Incorporated code into DCI provider.
|
|
*
|
|
*********************************************************/
|
|
|
|
VOID CalculateStretchCode (LONG srcLength, LONG dstLength, LPBYTE code)
|
|
{
|
|
LONG dwDeltaX, dwDeltaY, dwConst1, dwConst2, dwP;
|
|
LONG i, j, k;
|
|
BYTE bStretchIndex = 0;
|
|
LONG total = 0;
|
|
|
|
/*
|
|
* for some strange reason I'd like to figure out but haven't got time to, the
|
|
* replication code generation seems to have a problem between 1:1 and 2:1 stretch
|
|
* ratios. Fix is to zero-initialize index (the problem occurs in the first one
|
|
* generated) when stretch is betw. those ratios, and one-initialize it otherwise.
|
|
*/
|
|
if ((dstLength <= srcLength * 2L) && (dstLength >= srcLength))
|
|
{
|
|
bStretchIndex = 0;
|
|
}
|
|
else
|
|
{
|
|
bStretchIndex = 1;
|
|
}
|
|
|
|
/*
|
|
* initialize code array, to get rid of anything which might have been
|
|
* left over in it.
|
|
*/
|
|
for (i = 0; i < srcLength; i++)
|
|
{
|
|
code[i] = 0;
|
|
}
|
|
|
|
/*
|
|
* Variable names roughly represent what you will find in any graphics
|
|
* text. Consult text for an explanation of Bresenham line alg., it's
|
|
* beyond the scope of my comments here.
|
|
*/
|
|
dwDeltaX = srcLength;
|
|
dwDeltaY = dstLength;
|
|
|
|
if (dstLength < srcLength)
|
|
{
|
|
/*
|
|
* Size is shrinking, use standard Bresenham alg.
|
|
*/
|
|
dwConst1 = 2L * dwDeltaY;
|
|
dwConst2 = 2L * (dwDeltaY - dwDeltaX);
|
|
dwP = 2L * dwDeltaY - dwDeltaX;
|
|
|
|
for (i = 0; i < dwDeltaX; i++)
|
|
{
|
|
if (dwP <= 0L)
|
|
{
|
|
dwP += dwConst1;
|
|
}
|
|
else
|
|
{
|
|
dwP += dwConst2;
|
|
code[i]++;
|
|
total++;
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* Size is increasing. Use Bresenham adapted for slope > 1, and
|
|
* use a loop invariant to generate code array. Run index i from
|
|
* 0 to dwDeltaY - 1, and when i = dwDeltaY - 1, j will
|
|
* be = dwDeltaX - 1.
|
|
*/
|
|
dwConst1 = 2L * dwDeltaX;
|
|
dwConst2 = 2L * (dwDeltaX - dwDeltaY);
|
|
dwP = 2L * dwDeltaX - dwDeltaY;
|
|
j = 0;
|
|
|
|
for (i = 0; i < dwDeltaY; i++)
|
|
{
|
|
if (dwP <= 0L)
|
|
{
|
|
dwP += dwConst1;
|
|
bStretchIndex++;
|
|
}
|
|
else
|
|
{
|
|
dwP += dwConst2;
|
|
code[j++] = ++bStretchIndex;
|
|
bStretchIndex = 0;
|
|
total += (int)code[j - 1];
|
|
}
|
|
}
|
|
|
|
/*
|
|
* UGLY fix up for wacky bug which I have no time to fix properly.
|
|
* The 'total' of entries is messed up for slopes > 4, so add the
|
|
* difference back into the array.
|
|
*/
|
|
if (total < dwDeltaY)
|
|
{
|
|
while (total < dwDeltaY)
|
|
{
|
|
j = (int)dwDeltaY - total;
|
|
k = (int)dwDeltaY / j;
|
|
for (i = 0; i < dwDeltaX; i++)
|
|
{
|
|
if (!(i % k) && (total < dwDeltaY))
|
|
{
|
|
code[i]++;
|
|
total++;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: GetThresholdValue
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* Determines the best threshold for the specified
|
|
* surface.
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* Threshold
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 09/25/95
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
|
|
BYTE GetThresholdValue(VOID)
|
|
{
|
|
return ((BYTE) 0x0A);
|
|
}
|
|
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: MustLineRelicate
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* Checks to see if we must line replicate or if we can
|
|
* interpolate.
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* TRUE/FALSE
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 09/25/96
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
|
|
BOOL MustLineReplicate (PDEV* ppdev, PDD_SURFACE_LOCAL lpSurface, WORD wVideoDepth)
|
|
{
|
|
LONG lTempThresh;
|
|
|
|
/*
|
|
* If we are double clocking the data (1280x1024 mode), we must
|
|
* replicate. We should also always replicate in Performance mode
|
|
*/
|
|
if (ppdev->bDoubleClock)
|
|
{
|
|
return (TRUE);
|
|
}
|
|
|
|
//
|
|
// Check the VCLK
|
|
//
|
|
// sge07
|
|
if (GetVCLK(ppdev) > 130000)
|
|
{
|
|
return (TRUE);
|
|
}
|
|
|
|
/*
|
|
* If we are using the chroma key feature, we can't interpolate
|
|
*/
|
|
if (lpSurface->dwReserved1 & (OVERLAY_FLG_COLOR_KEY | OVERLAY_FLG_SRC_COLOR_KEY))
|
|
{
|
|
return (TRUE);
|
|
}
|
|
|
|
lTempThresh = ppdev->lFifoThresh;
|
|
if (ppdev->pfnIsSufficientBandwidth(ppdev, wVideoDepth,
|
|
&ppdev->rOverlaySrc, &ppdev->rOverlayDest, OVERLAY_FLG_INTERPOLATE))
|
|
{
|
|
ppdev->lFifoThresh = lTempThresh;
|
|
return (FALSE);
|
|
}
|
|
ppdev->lFifoThresh = lTempThresh;
|
|
|
|
return (TRUE);
|
|
}
|
|
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: IsSufficientBandwidth
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* Determines is sufficient bandwidth exists for the requested
|
|
* configuration.
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* TRUE/FALSE
|
|
* It also sets the global parameter lFifoThresh, which gets
|
|
* programed in RegInitVideo().
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 09/25/96
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
|
|
BOOL IsSufficientBandwidth(PDEV* ppdev, WORD wVideoDepth, LPRECTL lpSrc, LPRECTL lpDest, DWORD dwFlags)
|
|
{
|
|
LONG lVideoPixelsPerDWORD;
|
|
LONG lGraphicsPixelsPerDWORD;
|
|
LONG lVCLKPeriod;
|
|
LONG lTransferTime;
|
|
LONG lDWORDsWritten;
|
|
LONG lZoom;
|
|
LONG lReadPeriod;
|
|
LONG lEffReadPeriod;
|
|
LONG lWritePeriod;
|
|
LONG lEffWritePeriod;
|
|
LONG K1,K2;
|
|
LONG lTrFifoAFirst4;
|
|
LONG lTrFifoB2;
|
|
LONG lDWORDsRead;
|
|
LONG lFifoAReadPeriod;
|
|
LONG lFifoBReadPeriod;
|
|
LONG lFifoAEffWritePeriod;
|
|
LONG lFifoBEffWritePeriod;
|
|
LONG lFifoALevels;
|
|
LONG lFifoBLevels;
|
|
LONG lFifoAThresh;
|
|
LONG lFifoBThresh;
|
|
LONG lVCLK;
|
|
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
//#define BLIT_LATENCY 8
|
|
#define CRT_FIFO_DEPTH 28
|
|
|
|
//
|
|
// Add 8 clock for BLT_LATENCY for 54446BE and later chips
|
|
//
|
|
// sge04
|
|
|
|
LONG BLIT_LATENCY = 8;
|
|
if (ppdev->flCaps & CAPS_SECOND_APERTURE)
|
|
BLIT_LATENCY += 2;
|
|
|
|
/*
|
|
* Convert input parameters
|
|
*/
|
|
if (wVideoDepth == 16)
|
|
{
|
|
lVideoPixelsPerDWORD = 2;
|
|
}
|
|
else
|
|
{
|
|
lVideoPixelsPerDWORD = 4;
|
|
}
|
|
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
lGraphicsPixelsPerDWORD = 4;
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 16)
|
|
{
|
|
lGraphicsPixelsPerDWORD = 2;
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 24)
|
|
{
|
|
lGraphicsPixelsPerDWORD = 1;
|
|
}
|
|
else
|
|
return (FALSE);
|
|
|
|
lZoom = ((lpDest->right - lpDest->left) * 256) /
|
|
(lpSrc->right - lpSrc->left);
|
|
|
|
/*
|
|
* If we are double clocked, fail if we are not zoomed at least 2X
|
|
*/
|
|
if (ppdev->bDoubleClock && (lZoom < 512))
|
|
{
|
|
return (FALSE);
|
|
}
|
|
|
|
/*
|
|
* We need to get the VCLK every time since this can change
|
|
* at run-time
|
|
*/
|
|
lVCLK = GetVCLK(ppdev);
|
|
if (lVCLK == 0)
|
|
{
|
|
return (FALSE);
|
|
}
|
|
lVCLKPeriod = (LONG) ((1000000/lVCLK) + 1);
|
|
|
|
/*
|
|
* We only need to setup the following variables once!
|
|
*/
|
|
if (!ppdev->lBusWidth)
|
|
{
|
|
/*
|
|
* We will read the bus width from SR0F[4:3]
|
|
*/
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, 0x0F);
|
|
if ((CP_IN_BYTE(pjPorts, SR_DATA) & 0x18) == 0x18)
|
|
{
|
|
ppdev->lBusWidth = 8; // 64 bit bus
|
|
}
|
|
else
|
|
{
|
|
ppdev->lBusWidth = 4; // 32 bit bus
|
|
}
|
|
}
|
|
if (!ppdev->lRandom)
|
|
{
|
|
/*
|
|
* Is this EDO or regular?
|
|
*/
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, 0x0f);
|
|
if (!(CP_IN_BYTE(pjPorts, SR_DATA) & 0x4))
|
|
{
|
|
ppdev->lRandom = 7;
|
|
ppdev->lPageMiss = 7;
|
|
}
|
|
else
|
|
{
|
|
ppdev->lRandom = 6;
|
|
ppdev->lPageMiss = 6;
|
|
}
|
|
}
|
|
|
|
if (!ppdev->lMCLKPeriod)
|
|
{
|
|
LONG lMCLK;
|
|
|
|
/*
|
|
* The MCLK period is the amount of time required for one cycle.
|
|
* We will round up.
|
|
*/
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, 0x1f); // First get the MCLK frequency
|
|
lMCLK = CP_IN_BYTE(pjPorts, SR_DATA);
|
|
lMCLK *= 14318;
|
|
lMCLK >>= 3;
|
|
ppdev->lMCLKPeriod = ((1000000/lMCLK) + 1);
|
|
}
|
|
|
|
/*
|
|
* Check for the case with no color key or Y interpolation
|
|
*/
|
|
if (dwFlags == 0)
|
|
{
|
|
/*
|
|
* This mode utilizes only FIFO A. The fifo is filled with
|
|
* graphics data during regions 1 and 3, and video data during
|
|
* region 2.
|
|
*
|
|
* The normal memory sequence for this mode goes as follows.
|
|
*
|
|
* ------------------------------------------------
|
|
* | cpu/blit cycle | FIFO A fill | cpu/blit cycle ....
|
|
* ------------------------------------------------
|
|
*
|
|
* The cpu/blit cycle is interrupted when the CRT
|
|
* fifo is depleted to its threshold. Once the
|
|
* crt cycle is started, it continues until the
|
|
* FIFO A is full.
|
|
*
|
|
* Worst case condition for filling the CRT fifo :
|
|
*
|
|
* 1) CPU/blit latency ->
|
|
* 2) Random cycle for region 2 video ->
|
|
* 3) Page miss for region 2 video ->
|
|
* 4) Page miss for region 2 to region 3 transition ->
|
|
* 5) Page miss for region 3 graphics
|
|
*
|
|
* Conditions 3 and 5 depend on the location of the
|
|
* graphic screen within display memory. For 1024x768, where
|
|
* the graphics screen starts at location 0 and is offset by
|
|
* 1024 or 2048 bytes each line, condition 5 is never met.
|
|
* If a video window starts at beginning of a memory page,
|
|
* and is offset at the beggining of each line by an even
|
|
* multiple of a memory page, condition 3 is never met.
|
|
*
|
|
* Based on this worst case condition, the amount of time
|
|
* required to complete 4 transfers into the crt fifo
|
|
* is approximately:
|
|
* lTransferTime = (BLIT_LATENCY + lRandom + 3*(lPageMiss)) *
|
|
* lMCLKPeriod.
|
|
* the number of dwords transferred to the fifo
|
|
* during this time is 4 for 32 bit memory interface
|
|
* or 8 for 64 bit interface.
|
|
* lDWORDsWritten = 4 * (lBusWidth/4)
|
|
*
|
|
* During this period, data continues to be read from the crt
|
|
* fifo for screen refresh. The amount of data read,
|
|
* assuming a 1x scale is approximately:
|
|
* lDWORDsRead = tr_time/(lVideoPixelsPerDWORD * lVCLKPeriod)
|
|
*
|
|
* The difference between the dwords read and dwords
|
|
* written must be accounted for in the fifo trheshold setting
|
|
*
|
|
* lFifoThresh = (lDWORDsRead - lDWORDsWritten) rounded
|
|
* up to next even value.
|
|
*
|
|
* To determine if there is adequate bandwidth to support
|
|
* the mode, the lFifoThresh must not exceed the fifo depth.
|
|
* For the mode to work, the fifo read rate must not exceed the
|
|
* fifo write rate.
|
|
* read_rate = min(lGraphicsPixelsPerDWORD,lVideoPixelsPerDWORD) * lVCLKPeriod.
|
|
* write_rate = lMCLKPeriod * 2; -- 2 clocks per cas
|
|
*
|
|
* A special case occurs if the fifo read rate is very close to the peak
|
|
* fifo write rate. In this case the crt fill may result in a continuous
|
|
* page cycle for the entire active line. This could result in 1 extra
|
|
* page miss at the start of region2. To account for this, I will
|
|
* add 3 DWORDS to the trheshold if the read and write rates are very close
|
|
* (arbitrarily defined as within 10% of each other.
|
|
*
|
|
* Zooming
|
|
* Some modes can only be supported at video scale factors greater than 1X.
|
|
* Even when the video is zoomed, a small number of dwords must be read
|
|
* from the crt fifo at the unzoomed rate in order to prime the video
|
|
* pipeline. The video pipeline requires 10 pixel before it slows the fifo
|
|
* reads to the zoomed rate.
|
|
*
|
|
* tr_time - (lVCLKPeriod * 10/lVideoPixelsPerDWORD)
|
|
* lDWORDsRead = --------------------------------------------- + 10/lVideoPixelsPerDWORDord
|
|
* (lVideoPixelsPerDWORD * lVCLKPeriod * lZoom)
|
|
*/
|
|
lTransferTime = (BLIT_LATENCY + ppdev->lRandom + (3*(ppdev->lPageMiss))) *
|
|
ppdev->lMCLKPeriod;
|
|
|
|
lDWORDsWritten = 3 * (ppdev->lBusWidth/4);
|
|
|
|
/*
|
|
* If read rate exceeds write rate, calculate minumum zoom
|
|
* to keep everything as ints, spec the zoom as 256 times
|
|
* the fractional zoom
|
|
*/
|
|
lWritePeriod = ppdev->lMCLKPeriod * 2/(ppdev->lBusWidth/4);
|
|
lReadPeriod = lVideoPixelsPerDWORD * lVCLKPeriod;
|
|
|
|
/*
|
|
* Pick worst case of graphics and video depths for calculation
|
|
* of dwords read. This may be a little pessimistic for the
|
|
* when the graphics bits per pixel exceeds the video bits per pixel.
|
|
*/
|
|
lEffReadPeriod = (lVideoPixelsPerDWORD * lVCLKPeriod * lZoom)/256;
|
|
if (lEffReadPeriod < lWritePeriod)
|
|
{
|
|
/*
|
|
* Cannot support overlay at this zoom factor
|
|
*/
|
|
return (0);
|
|
}
|
|
|
|
if (lGraphicsPixelsPerDWORD > lVideoPixelsPerDWORD) // handle zoom factor
|
|
{
|
|
lDWORDsRead = ((lTransferTime -
|
|
(lVCLKPeriod * 10/lVideoPixelsPerDWORD))/
|
|
(lEffReadPeriod)) +
|
|
(10 / lVideoPixelsPerDWORD) + 1;
|
|
}
|
|
else
|
|
{
|
|
lDWORDsRead = (lTransferTime/
|
|
(lGraphicsPixelsPerDWORD * lVCLKPeriod)) + 1;
|
|
}
|
|
|
|
// Calculate the fifo threshold setting
|
|
ppdev->lFifoThresh = lDWORDsRead - lDWORDsWritten;
|
|
|
|
// if read rate is within 10% of write rate, up by 3 dwords
|
|
if ((11*lEffReadPeriod) < ((10*lWritePeriod*256)/lZoom))
|
|
{
|
|
ppdev->lFifoThresh += 3;
|
|
}
|
|
|
|
// fifo trheshold spec'd in QWORDS, so round up by 1 and divide by 2)
|
|
ppdev->lFifoThresh = (ppdev->lFifoThresh + 1)/2;
|
|
|
|
// Add a extra QWORD to account for fifo level sync logic
|
|
ppdev->lFifoThresh = ppdev->lFifoThresh + 1;
|
|
if (ppdev->bDoubleClock)
|
|
{
|
|
ppdev->lFifoThresh <<= 1;
|
|
}
|
|
|
|
if ((ppdev->lFifoThresh >= CRT_FIFO_DEPTH) ||
|
|
((lEffReadPeriod) < lWritePeriod))
|
|
{
|
|
return (0);
|
|
}
|
|
else
|
|
{
|
|
return (1);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Check bandwidth for Y Interpolation
|
|
*/
|
|
else if (dwFlags & OVERLAY_FLG_INTERPOLATE)
|
|
{
|
|
/*
|
|
* This mode utilizes both FIFOs A and B. During horizontal blank,
|
|
* both fifos are filled. FIFO a is then filled with graphics
|
|
* data during regions 1 and 3, and video data during region 2.
|
|
* FIFO B is filled with video data during region 2, and is idle
|
|
* during regions 1 and 3.
|
|
*
|
|
* The normal memory sequence for this mode goes as follows.
|
|
*
|
|
* ----------------------------------------------------------------
|
|
* | cpu/blit cycle | FIFO A fill | FIFO B fill | cpu/blit cycle .
|
|
* ----------------------------------------------------------------
|
|
* or
|
|
* ----------------------------------------------------------------
|
|
* | cpu/blit cycle | FIFO B fill | FIFO A fill | cpu/blit cycle .
|
|
* ----------------------------------------------------------------
|
|
*
|
|
* For this mode, the FIFO threshold must be set high enough to allow
|
|
* enough time to abort the cpu/blt, fill FIFO A, then transfer data
|
|
* into FIFO B before underflow occurs.
|
|
*
|
|
* Worst case condition for filling the CRT fifo :
|
|
*
|
|
* 1) CPU/blit latency ->
|
|
* 2) FIFO A random cycle for region 2 video ->
|
|
* 3) FIFO A page miss for region 2 video ->
|
|
* 4) FIFO A page miss for region 2 to region 3 transition ->
|
|
* 5) FIFO A page miss for region 3 graphics
|
|
* 6) FIFO A page mode fill
|
|
* 7) FIFO B random cycle
|
|
* 8) FIFO B page miss
|
|
*
|
|
* lTransferTime = lMCLKPeriod *
|
|
* (BLIT_LATENCY + lRandom + 3*(lPageMiss) +
|
|
* fifoa_remaining +
|
|
* lRandom + lPageMiss;
|
|
*
|
|
*
|
|
* The time required to fill FIFO A depends upon the read rate
|
|
* of FIFO A and the number of levels that must be filled,
|
|
* as determined by the threshold setting.
|
|
*
|
|
* The worst case fill time for the first four levels of fifo A is
|
|
* lTrFifoAFirst4 = (BLIT_LATENCY + lRandom + 3*(lPageMiss)) *
|
|
* lMCLKPeriod;
|
|
*
|
|
* The number of dwords depleted from fifo A during the
|
|
* fill of the first four levels is
|
|
* lReadPeriod = lVCLKPeriod * lVideoPixelsPerDWORD * lZoom;
|
|
* fifoa_reads_4 = lTrFifoAFirst4/lReadPeriod;
|
|
*
|
|
* The number of empty levels remaining in the fifo after
|
|
* the fill of the first four levels is
|
|
* fifoa_remaining = FIFO_DEPTH - lFifoThresh + ((4*ramwidth)/4)
|
|
* - lTrFifoAFirst4/lReadPeriod;
|
|
*
|
|
* The amount of time required to fill the remaining levels of
|
|
* fifo A is determined by the write rate and the read rate.
|
|
* lWritePeriod = lMCLKPeriod * 2; // 2 clks per cas
|
|
* lEffWritePeriod = ((lReadPeriod * lWritePeriod)/
|
|
* (lReadPeriod - lWritePeriod));
|
|
*
|
|
* tr_fifoa_remaining = fifoa_remaining * lEffWritePeriod;
|
|
*
|
|
*
|
|
* The total amount of time for the cpu/blt latency and the
|
|
* fifo A fill is
|
|
* tr_fifoa_total = lTrFifoAFirst4 + tr_fifoa_remaining;
|
|
*
|
|
* The worse case fill time for fifo B is as follows:
|
|
* lTrFifoB2 = (lRandom + lPageMiss) * lMCLKPeriod;
|
|
*
|
|
* The total amount of time elapsed from the crt request until
|
|
* the first 2 fifob cycles are completed is
|
|
* lTransferTime = tr_fifoa_total + lTrFifoB2;
|
|
*
|
|
* The number of dwords transferred to the fifo during this
|
|
* time is 2 for 32 bit memory interface or 4 for 64 bit interface.
|
|
* lDWORDsWritten = 2 * (lBusWidth/4)
|
|
*
|
|
* During this period, data continues to be read from the crt
|
|
* fifo B for screen refresh. The amount of data read,
|
|
* is approximately:
|
|
* dwords_read = lTransferTime/lReadPeriod
|
|
*
|
|
* The difference between the dwords read and dwords
|
|
* written must be accounted for in the fifo trheshold setting
|
|
*
|
|
* lFifoThresh = (dwords_read - lDWORDsWritten) rounded
|
|
* up to next even value.
|
|
*
|
|
* Since the lTransferTime and dwords_read depends on
|
|
* the threshold setting, a bit of algebra is required to determine
|
|
* the minimum setting to prevent fifo underflow.
|
|
*
|
|
* lFifoThresh = (lTransferTime/lReadPeriod) - lDWORDsWritten;
|
|
* = ((tr_fifoa_4 + lTrFifoB2 + tr_fifoa_remaining)/lReadPeriod)
|
|
* - lDWORDsWritten
|
|
* to simplify calcuation, break out constant part of equation
|
|
* K1 = ((tr_fifoa_4 + lTrFifoB2)/lReadPeriod) - lDWORDsWritten;
|
|
*
|
|
* lFifoThresh = K1 + (tr_fifoa_remaining/lReadPeriod);
|
|
* = K1 + (fifoa_remaining * lEffWritePeriod)/lReadPeriod;
|
|
* lFifoThresh = K1 +
|
|
* ((FIFO_DEPTH - lFifoThresh + 4 - (lTrFifoAFirst4/lReadPeriod)) *
|
|
* lEffWritePeriod)/lReadPeriod;
|
|
*
|
|
* break out another constant to simplify reduction
|
|
* K2 = (FIFO_DEPTH + 4 - (lTrFifoAFirst4/lReadPeriod))
|
|
* * (lEffWritePeriod/lReadPeriod);
|
|
* lFifoThresh = K1 + K2 - (lFifoThresh * (lEffWritePeriod/lReadPeriod));
|
|
* lFifoThresh * (1 + (lEffWritePeriod/lReadPeriod)) = K1 + K2;
|
|
* lFifoThresh = (K1 + K2)/(1 + (lEffWritePeriod/lReadPeriod);
|
|
*
|
|
* Once the threshold setting is determined, another calculation must
|
|
* be performed to determine if available bandwidth exists given the
|
|
* zoom factor. The worst case is assumed to be when FIFO A and
|
|
* FIFO B reach the threshold point at the same time. The sequence
|
|
* is then to abort the cpu/blt, fill fifo a, then fill fifo b.
|
|
*
|
|
* Since FIFO A is full when the fill B operation starts, I only have
|
|
* to determine how long it takes to fill FIFO B and then calculate
|
|
* the the number of dwords read from A during that time.
|
|
*
|
|
* lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * lEffWritePeriod))/lReadPeriod;
|
|
* lFifoALevels = CRT_FIFO_DEPTH - (lTransferTime/lReadPeriod);
|
|
*
|
|
* if lFifoALevels < 1, then underflow condition may occur.
|
|
*/
|
|
if (lZoom < 512)
|
|
{
|
|
// 5446 requires at least a 2X zoom for Y interpolation
|
|
return (FALSE);
|
|
}
|
|
|
|
lWritePeriod = ppdev->lMCLKPeriod * 2/(ppdev->lBusWidth/4);
|
|
lReadPeriod = (lVideoPixelsPerDWORD * lVCLKPeriod * lZoom)/256;
|
|
|
|
lEffWritePeriod = ((lReadPeriod * lWritePeriod)/
|
|
(lReadPeriod - lWritePeriod));
|
|
lTrFifoAFirst4 = (BLIT_LATENCY + ppdev->lRandom + 3*(ppdev->lPageMiss)) *
|
|
ppdev->lMCLKPeriod;
|
|
lTrFifoB2 = (ppdev->lRandom + ppdev->lPageMiss) * ppdev->lMCLKPeriod;
|
|
|
|
lDWORDsWritten = 2 * (ppdev->lBusWidth/4);
|
|
K1 = ((lTrFifoAFirst4 + lTrFifoB2)/lReadPeriod) - lDWORDsWritten;
|
|
K2 = (CRT_FIFO_DEPTH + (4*(ppdev->lBusWidth/4)) -
|
|
(lTrFifoAFirst4/lReadPeriod))
|
|
* (lEffWritePeriod/lReadPeriod);
|
|
ppdev->lFifoThresh = (1 + ((K1 + K2)/(1 + (lEffWritePeriod/lReadPeriod))));
|
|
|
|
ppdev->lFifoThresh += 3;
|
|
|
|
lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * lEffWritePeriod));
|
|
lFifoALevels = ((CRT_FIFO_DEPTH - (lTransferTime/lReadPeriod))/2);
|
|
if (ppdev->bDoubleClock)
|
|
{
|
|
ppdev->lFifoThresh <<= 1;
|
|
}
|
|
|
|
if ((lFifoALevels < 2) || (ppdev->lFifoThresh > (CRT_FIFO_DEPTH/2)))
|
|
{
|
|
return (0);
|
|
}
|
|
else
|
|
{
|
|
return (1);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Check bandwidth for color keying
|
|
*/
|
|
else if (dwFlags & (OVERLAY_FLG_COLOR_KEY | OVERLAY_FLG_SRC_COLOR_KEY))
|
|
{
|
|
/*
|
|
* This mode utilizes both FIFOs A and B. During horizontal blank,
|
|
* both fifos are filled. FIFO a is then filled with graphics data
|
|
* during regions 1,2 and 3. FIFO B is filled with video data
|
|
* during region 2, and is idle during regions 1 and 3.
|
|
*
|
|
* The normal memory sequence for this mode goes as follows.
|
|
*
|
|
* ----------------------------------------------------------------
|
|
* | cpu/blit cycle | FIFO A fill | FIFO B fill | cpu/blit cycle .
|
|
* ----------------------------------------------------------------
|
|
* or
|
|
* ----------------------------------------------------------------
|
|
* | cpu/blit cycle | FIFO B fill | FIFO A fill | cpu/blit cycle .
|
|
* ----------------------------------------------------------------
|
|
*
|
|
* For this mode, the FIFO threshold must be set high enough to allow
|
|
* enough time to abort the cpu/blt, fill FIFO A, then transfer data
|
|
* into FIFO B before underflow occurs. If the fifob read rate is
|
|
* greater than the fifoa read rate, then allow eough time for
|
|
* a t CPU/blt abort, followed by a fifo B fill, then a FIFO A fill.
|
|
*
|
|
* Worst case condition for filling the CRT fifo :
|
|
*
|
|
* 1) CPU/blit latency ->
|
|
* 2) FIFO A random ->
|
|
* 3) FIFO A page miss ->
|
|
* 6) FIFO A page mode fill -->
|
|
* 7) FIFO B random -->
|
|
* 8) FIFO B page miss
|
|
*
|
|
* or
|
|
*
|
|
* 1) CPU/blit latency ->
|
|
* 2) FIFO B random ->
|
|
* 3) FIFO A page miss ->
|
|
* 6) FIFO A page mode fill -->
|
|
* 7) FIFO B random -->
|
|
* 8) FIFO B page miss
|
|
*
|
|
*
|
|
* 1) lTransferTime = lMCLKPeriod *
|
|
* (BLIT_LATENCY + lRandom + lPageMiss +
|
|
* fifoa_remaining +
|
|
* lRandom + lPageMiss;
|
|
*
|
|
* or
|
|
* 2) lTransferTime = lMCLKPeriod *
|
|
* (BLIT_LATENCY + lRandom + lPageMiss +
|
|
* fifob_remaining +
|
|
* lRandom + lPageMiss;
|
|
*
|
|
*
|
|
* lFifoAReadPeriod = lVCLKPeriod * lGraphicsPixelsPerDWORD;
|
|
* lFifoBReadPeriod = (lVCLKPeriod * lVideoPixelsPerDWORD * lZoom)*256;
|
|
*
|
|
* if (lFifoAReadPeriod > lFifoBReadPeriod), then
|
|
* first fifo is fifo B, otherwise first is fifo A.
|
|
* The followinf euqations are written for a fifoa->fifob,
|
|
* sequence, but the fifob->fifoa sequence can be obtained simply
|
|
* by swapping the fifo read periods.
|
|
*
|
|
* The time required to fill a FIFO depends upon the read rate
|
|
* of the FIFO and the number of levels that must be filled,
|
|
* as determined by the threshold setting.
|
|
*
|
|
* The worst case fill time for the first four levels of fifo A is
|
|
* lTrFifoAFirst4 = (BLIT_LATENCY + lRandom + lPageMiss) *
|
|
* lMCLKPeriod;
|
|
*
|
|
* The number of dwords depleted from fifo A during the
|
|
* fill of the first four levels is
|
|
* fifoa_reads_4 = lTrFifoAFirst4/lFifoAReadPeriod;
|
|
*
|
|
* The number of empty levels remaining in the fifo after
|
|
* the fill of the first four levels is
|
|
* fifoa_remaining = FIFO_DEPTH - lFifoThresh + ((4*ramwidth)/4)
|
|
* - lTrFifoAFirst4/lFifoAReadPeriod;
|
|
*
|
|
* The amount of time required to fill the remaining levels of
|
|
* fifo A is determined by the write rate and the read rate.
|
|
* lWritePeriod = lMCLKPeriod * 2; * 2 clks per cas
|
|
* eff_write_period = ((lFifoAReadPeriod * lWritePeriod)/
|
|
* (lFifoAReadPeriod - lWritePeriod));
|
|
*
|
|
* tr_fifoa_remaining = fifoa_remaining * eff_write_period;
|
|
*
|
|
*
|
|
* The total amount of time for the cpu/blt latency and the
|
|
* fifo A fill is
|
|
* tr_fifoa_total = lTrFifoAFirst4 + tr_fifoa_remaining;
|
|
*
|
|
* The worse case fill time for fifo B is as follows:
|
|
* lTrFifoB2 = (lRandom + lPageMiss) * lMCLKPeriod;
|
|
*
|
|
* The total amount of time elapsed from the crt request until
|
|
* the first 2 fifob cycles are completed is
|
|
* lTransferTime = tr_fifoa_total + lTrFifoB2;
|
|
*
|
|
* The number of dwords transferred to the fifo during this time
|
|
* is 2 for 32 bit memory interface or 4 for 64 bit interface.
|
|
* lDWORDsWritten = 2 * (lBusWidth/4)
|
|
*
|
|
* During this period, data continues to be read from the crt
|
|
* fifo B for screen refresh. The amount of data read,
|
|
* is approximately:
|
|
* lFifoBReadPeriod = (lVCLKPeriod * lVideoPixelsPerDWORD * lZoom)/256;
|
|
* dwords_read = lTransferTime/lFifoBReadPeriod
|
|
*
|
|
* The difference between the dwords read and dwords
|
|
* written must be accounted for in the fifo trheshold setting
|
|
*
|
|
* lFifoThresh = (dwords_read - lDWORDsWritten) rounded
|
|
* up to next even value.
|
|
*
|
|
* Since the lTransferTime and dwords_read depends on the
|
|
* threshold setting, a bit of algebra is required to determine
|
|
* the minimum setting to prevent fifo underflow.
|
|
*
|
|
* lFifoThresh = (lTransferTime/lFifoBReadPeriod) - lDWORDsWritten;
|
|
* = ((tr_fifoa_4 + lTrFifoB2 + tr_fifoa_remaining)/lFifoBReadPeriod)
|
|
* - lDWORDsWritten
|
|
* to simplify calcuation, break out constant part of equation
|
|
* K1 = ((tr_fifoa_4 + lTrFifoB2)/lFifoBReadPeriod) - lDWORDsWritten;
|
|
*
|
|
* lFifoThresh = K1 + (tr_fifoa_remaining/lFifoBReadPeriod);
|
|
* = K1 + (fifoa_remaining * eff_write_period)/lFifoBReadPeriod;
|
|
* lFifoThresh = K1 +
|
|
* ((FIFO_DEPTH - lFifoThresh + 4 - (lTrFifoAFirst4/lFifoAReadPeriod)) *
|
|
* eff_write_period)/read_period;
|
|
*
|
|
* break out another constant to simplify reduction
|
|
* K2 = (FIFO_DEPTH + 4 - (lTrFifoAFirst4/lFifoAReadPeriod))
|
|
* * (eff_write_period/lFifoBReadPeriod);
|
|
* lFifoThresh = K1 + K2 - (lFifoThresh * (eff_write_period/lFifoBReadPeriod));
|
|
* lFifoThresh * (1 + (eff_write_period/read_period)) = K1 + K2;
|
|
* lFifoThresh = (K1 + K2)/(1 + (eff_write_period/lFifoBReadPeriod);
|
|
*
|
|
* Once the threshold setting is determined, another calculation must
|
|
* be performed to determine if available bandwidth exists given the
|
|
* zoom factor. The worst case is assumed to be when FIFO A and
|
|
* FIFO B reach the threshold point at the same time. The sequence
|
|
* is then to abort the cpu/blt, fill fifo a, then fill fifo b.
|
|
*
|
|
* Since FIFO A is full when the fill B operation starts, I only have
|
|
* to determine how long it takes to fill FIFO B and then calculate
|
|
* the the number of dwords read from A during that time.
|
|
*
|
|
* lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * fifob_eff_write_period))/read_period;
|
|
* fifoa_levels = CRT_FIFO_DEPTH - (lTransferTime/read_period);
|
|
*
|
|
* if fifoa_levels < 1, then underflow condition may occur.
|
|
*/
|
|
lWritePeriod = ppdev->lMCLKPeriod * 2/(ppdev->lBusWidth/4);
|
|
lFifoAReadPeriod = lGraphicsPixelsPerDWORD * lVCLKPeriod;
|
|
lFifoBReadPeriod = (lVideoPixelsPerDWORD * lVCLKPeriod * lZoom)/256;
|
|
|
|
if (lFifoAReadPeriod <= lWritePeriod) // this fails, so set a big#
|
|
{
|
|
lFifoAEffWritePeriod = 5000;
|
|
}
|
|
else
|
|
{
|
|
lFifoAEffWritePeriod = ((lFifoAReadPeriod * lWritePeriod)/
|
|
(lFifoAReadPeriod - lWritePeriod));
|
|
}
|
|
|
|
if (lFifoBReadPeriod <= lWritePeriod) // this fails, so set a big#
|
|
{
|
|
lFifoBEffWritePeriod = 5000;
|
|
}
|
|
else
|
|
{
|
|
lFifoBEffWritePeriod = ((lFifoBReadPeriod * lWritePeriod)/
|
|
(lFifoBReadPeriod - lWritePeriod));
|
|
}
|
|
|
|
if ((lFifoAReadPeriod == 0) || (lFifoBReadPeriod == 0) ||
|
|
(lWritePeriod == 0))
|
|
{
|
|
return (FALSE);
|
|
}
|
|
|
|
// These values should be the same for bot the fifoa->fifob
|
|
// and fifob->fifoa sequences
|
|
lTrFifoAFirst4 = (BLIT_LATENCY + ppdev->lRandom + 2*(ppdev->lPageMiss)) *
|
|
ppdev->lMCLKPeriod;
|
|
lTrFifoB2 = (ppdev->lRandom + ppdev->lPageMiss) * ppdev->lMCLKPeriod;
|
|
|
|
lDWORDsWritten = 2 * (ppdev->lBusWidth/4);
|
|
|
|
// Since I'm not sure which sequence is worse
|
|
// Try both then pick worse case results
|
|
|
|
// For fifoa->fifob sequence
|
|
K1 = ((lTrFifoAFirst4 + lTrFifoB2)/lFifoBReadPeriod) - lDWORDsWritten;
|
|
K2 = (CRT_FIFO_DEPTH + (4*(ppdev->lBusWidth/4)) -
|
|
(lTrFifoAFirst4/lFifoAReadPeriod))
|
|
* (lFifoAEffWritePeriod/lFifoBReadPeriod);
|
|
lFifoAThresh = (1 + ((K1 + K2)/
|
|
(1 + (lFifoAEffWritePeriod/lFifoBReadPeriod))));
|
|
|
|
lFifoAThresh += 3;
|
|
|
|
lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * lFifoBEffWritePeriod));
|
|
lFifoALevels = ((CRT_FIFO_DEPTH - (lTransferTime/lFifoAReadPeriod))/2);
|
|
|
|
// For fifob->fifoa sequence
|
|
K1 = ((lTrFifoAFirst4 + lTrFifoB2)/lFifoAReadPeriod) - lDWORDsWritten;
|
|
K2 = (CRT_FIFO_DEPTH + (4*(ppdev->lBusWidth/4)) -
|
|
(lTrFifoAFirst4/lFifoBReadPeriod))
|
|
* (lFifoBEffWritePeriod/lFifoAReadPeriod);
|
|
|
|
lFifoBThresh = (1 + ((K1 + K2)/
|
|
(1 + (lFifoBEffWritePeriod/lFifoAReadPeriod))));
|
|
|
|
lFifoBThresh += 3;
|
|
|
|
lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * lFifoAEffWritePeriod));
|
|
lFifoBLevels = ((CRT_FIFO_DEPTH - (lTransferTime/lFifoBReadPeriod))/2);
|
|
|
|
if (lFifoAThresh > lFifoBThresh)
|
|
{
|
|
ppdev->lFifoThresh = lFifoAThresh;
|
|
}
|
|
else
|
|
{
|
|
ppdev->lFifoThresh = lFifoBThresh;
|
|
}
|
|
if (ppdev->bDoubleClock)
|
|
{
|
|
ppdev->lFifoThresh <<= 1;
|
|
}
|
|
|
|
if ((lFifoBLevels <0) || (lFifoALevels < 0) ||
|
|
(ppdev->lFifoThresh > (CRT_FIFO_DEPTH/2)))
|
|
{
|
|
return (0);
|
|
}
|
|
else
|
|
{
|
|
return (1);
|
|
}
|
|
}
|
|
return (1); // Should never get here!!
|
|
}
|
|
|
|
|
|
|
|
// chu03
|
|
/**********************************************************
|
|
*
|
|
* Name: Is5480SufficientBandwidth
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* This function reads the current MCLK, VLCK, bus width, etc.
|
|
* and determines whether the chip has sufficient bandwidth
|
|
* to handle the requested mode.
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* none
|
|
*
|
|
***********************************************************/
|
|
|
|
// -------------------------------------------------------------
|
|
// Overview by John Schafer
|
|
// -------------------------------------------------------------
|
|
// The memory arbitration scheme for the 5480 has changed
|
|
// significantly from the 5446. The 5480 is set up on a first
|
|
// come, first serve basis. If more than 1 request arrive at
|
|
// the same clock edge, then the BankSelect is used to determine
|
|
// which request to acknowledge first. Using SDRAM, the row
|
|
// access to a differennt bank can be hidden, which saves up to
|
|
// 7 MCLKs. If all bank selects for the concurrent requests are
|
|
// the same, the default prority is FIFOA->FIFOB->FIFOC->VCAP.
|
|
//
|
|
// The FIFO sizes for the 5480 are as follows:
|
|
// FIFOA, FIFOB, FIFOC : 32x64
|
|
// VCAP : 16x64 (two 8x64 fifos)
|
|
//
|
|
// The Y interpolation mode for the 5480 is "free" due to
|
|
// the embedded line store. The available mode combinations
|
|
// for the 5480 which effect bandwidth are :
|
|
//
|
|
// 1) Capture enabled, 1 video window, no occlusion, not 420 format
|
|
// 2) Capture enabled, 1 video window, no occlusion, 420 format
|
|
// 3) Capture enabled, 1 video window, occlusion, not 420 format
|
|
// 4) Capture enabled, 1 video window, occlusion, 420 format
|
|
// 5) Capture enabled, 2 video windows (occlusion implied)
|
|
// 6) Capture disabled, 1 video window, no occlusion, not 420 format
|
|
// 7) Capture disabled, 1 video window, no occlusion, 420 format
|
|
// 8) Capture disabled, 1 video window, occlusion, not 420 format
|
|
// 9) Capture disabled, 1 video window, occlusion, 420 format
|
|
// 10) Capture disabled, 2 video windows (occlusion implied)
|
|
//
|
|
//
|
|
// -------------------------------------------------------------
|
|
// FIFO threshold description
|
|
// -------------------------------------------------------------
|
|
// The memory requests are generated based on the threshold settings
|
|
// of each FIFO. CRT FIFO thresholds during non-video window lines
|
|
// are determined by SR16(3:0). CRT FIFO thresholds during video
|
|
// window lines are determined by CR5C(3:0).
|
|
// The VCAP fifo threshold is a fixed setting of 8 QWORDS (half).
|
|
//
|
|
// The 4 bit threshold for FIFOs A,B, and C indicate the FIFO
|
|
// level in double QWORDS at which the FIFO request is asserted.
|
|
// For example, a setting of 4 indicates that the request is
|
|
// generated when the FIFO level is reduced to 8 QWORDS.
|
|
// A setting of 0 is a special case which indicates that the
|
|
// FIFO must be full to prevent a request (i.e. 32 QWORDS).
|
|
//
|
|
// The objective of the bandwidth equations is to calculate
|
|
// the optimum threshold setting and determine which display
|
|
// modes may be supported for given MCLK and VCLK frequencies.
|
|
//
|
|
// The critical parameters which determine the bandwidth limits
|
|
// are the read and effective write rates for each FIFO.
|
|
//
|
|
// -------------------------------------------------------------
|
|
// FIFO read/write rates for CRT FIFOs
|
|
// -------------------------------------------------------------
|
|
// The read rate for FIFO A (graphics FIFO) is determined by
|
|
// the graphics pixel depth and the VCLK frequency.
|
|
// fa_read_rate = gr_bytes_per_pixel * vclk_period
|
|
//
|
|
// The read rates for FIFO B and C are determined differently
|
|
// depending on display mode. For 420 format the read periods
|
|
// in nanosecs per byte are as follows:
|
|
// fb_read_period = ((vclk_period*4) * hzoom) / hdecimate;
|
|
// fc_read_period = ((vclk_period*4) * hzoom) / hdecimate;
|
|
//
|
|
// In this equation hdecimate is specified as 1/decimation_scale,
|
|
// i.e a 1/2 decimate implies hdecimate = 2
|
|
//
|
|
// For non 420 format the rates are:
|
|
// fb_read_period = ((vclk_period/vw_bytes_per_pixel) * hzoom) /
|
|
// hdecimate;
|
|
// fc_read_period = (vclk_period/vw_bytes_per_pixel);
|
|
//
|
|
// Since the FIFOs can be read and written simultaneously,
|
|
// the effective write rate is determined by the actual fifo
|
|
// write rate and tje fifo read rate. The actual write rate is based
|
|
// on single mclk display memory reads. The memory read period is
|
|
// calculated in terms of nanoseconds per byte.
|
|
//
|
|
// bytes_per_memory_transfer is equal to 4 for 32 bit i/f, 8 for 64 bit i/f
|
|
// mem_read_period = mclk_period/bytes_per_mem_transfer
|
|
// fa_eff_write_period = (mem_read_period * fa_read_period)/
|
|
// (fa_read_period - mem_read_period);
|
|
// fb_eff_write_period = (mem_read_period * fb_read_period)/
|
|
// (fb_read_period - mem_read_period);
|
|
// fc_eff_write_period = (mem_read_period * fc_read_period)/
|
|
// (fc_read_period - mem_read_period);
|
|
// -------------------------------------------------------------
|
|
// FIFO read/write rates for VCAP fifo
|
|
// -------------------------------------------------------------
|
|
// The video capture write rate is based on the data rate
|
|
// from the video capture interface. Since the video capture
|
|
// interface can perform format conversion (e.g. 422->PackJR) and
|
|
// decimation, the capture data rate may be smaller than the actual
|
|
// video port data rate. The capture period in the following equation
|
|
// is defined in terms of nanoseconds per byte. The decimation factor
|
|
// may vary from 1 to 1/256.
|
|
//
|
|
// vcap_write_period = (vport_pixel_period/capture_bytes_per_pixel) *
|
|
// (vport_decimation);
|
|
// In this equation vport_decimation is specified as 1/decimation_scale,
|
|
// i.e a 1/2 decimate implies vport_decimation = 2
|
|
//
|
|
//
|
|
// Since the VCAP fifo can be read and written simultaneously,
|
|
// the effective read rate is determined by the fifo write rate as well
|
|
// as the actual fifo read rate. The actual fifo read rate is based on two
|
|
// memory clock cycle display memory writes. The calculations are in terms
|
|
// of nanoseconds per byte.
|
|
// bytes_per_memory_transfer = 4 for 32 bit i/f, or 8 for 64 bit i/f
|
|
// mem_write_period = 2 * mclk_period/bytes_per_mem_transfer
|
|
//
|
|
// vcap_eff_read_period = (mem_write_period * vcap_write_period)/
|
|
// (vcap_write_period - mem_write_period);
|
|
//
|
|
// -------------------------------------------------------------------
|
|
// How to determine if FIFO ABC underflow or VCAP fifo overflow occurs
|
|
// -------------------------------------------------------------------
|
|
//
|
|
// I will examine a few worst case scenarios to determine if adequate
|
|
// bandwidth exists to support a given mode.
|
|
//
|
|
// Case #1 - start of graphics line where all 3 CRT fifos must be filled
|
|
//
|
|
// This condition occurs after hsync when the 3 CRT FIFOs are being
|
|
// prefilled before the start of the active line. The only risk here is
|
|
// that the video capture fifo may overflow during the consecutive fills
|
|
// of fifos A,B, and C. The threshold setting does not matter since the
|
|
// CRT fifos are cleared on reset and thus guaranteed to be empty.
|
|
//
|
|
// For a 32 bit memory interface :
|
|
// fabc_fill_time = (BLIT_LATENCY * mclk_period) +
|
|
// 3 * ((RAS_PRECHARGE + 64) * mclk_period)
|
|
//
|
|
// For a 64 bit memory interface :
|
|
// fabc_fill_time = (BLIT_LATENCY * mclk_period) +
|
|
// 3 * ((RAS_PRECHARGE + 32) * mclk_period)
|
|
//
|
|
// A capture fifo overflow occurs if fabc_fill_time is greater than
|
|
// VCAP fill time based on the worst case 30 MB/s capture rate.
|
|
//
|
|
// For a worst case memory interface scenario, let's assume a 32 bit
|
|
// interface with a 66 MHz memory clock, a blit latency of 10 mclks,
|
|
// and a ras precharge of 7 mclks. The fabc_fill_time is
|
|
// then
|
|
// fabc_fill_time = (10 * 15.2) +
|
|
// 3 * ((64 + 7) * 15.2) = 3390 ns
|
|
//
|
|
// Assuming the worst case 30 MB/s capture rate, the number of
|
|
// bytes written to the capture fifo during the fabc_fill_time is
|
|
// 3390 ns * (1 byte/33 ns) = 103 bytes
|
|
//
|
|
// Since the capture fifo is 128 bytes deep, the worst case scenario
|
|
// is OK so long as the capture fifo is emptied prior to the fabc_fill.
|
|
//
|
|
//
|
|
//
|
|
// Case #2 - Consecutive requests
|
|
//
|
|
// It seems that the worst case for servicing of requests is when the requests occur
|
|
// on consecutive mclks with the order of requests being from the slowest to the
|
|
// fastest data consumer. In other words, the first to be serviced is the capture fifo,
|
|
// then the 3 CRT fifos in the order of decreasing read_period.
|
|
//
|
|
// First calculate actual and effective read and write periods as decribed above.
|
|
// Then determine how many requests are active, this is a maximum of 4 if capture
|
|
// is enabled and all 3 CRT fifos are enabled. Assume that the capture rate
|
|
// is the slowest and thus is always serviced first. Then order the active
|
|
// CRT requests as f1 through f3, where f1 has the longest read period and
|
|
// f3 has the shortest.
|
|
//
|
|
// The sequence of events then becomes:
|
|
// empty vcap -> fill 1 -> fill 2 -> fill 3
|
|
//
|
|
//
|
|
// Depending on the number of active crt fifos, the fill 2 and fill 3 operations may
|
|
// be ommitted. The vcap empty is obviously ommitted if capture is not enabled.
|
|
//
|
|
// Now step through the sequence and verify that crt fifo underflows and capture
|
|
// underflows do not occur.
|
|
//
|
|
// If capture is enabled, calculate the latency and empty times
|
|
// vcap_latency = (BLIT_LATENCY + RAS_PRECHARGE) * mclk_period;
|
|
// vcap_bytes_to_empty = CAP_FIFO_DEPTH;
|
|
// vcap_empty_time = (vcap_read_period * vcap_bytes_to_empty);
|
|
// Since one of the capture fifos continues to fill while the other is being
|
|
// emptied, calculate the number of filled levels in the capture fifo at
|
|
// the end of the memory transfer.
|
|
// vcap_levels_remaining = (vcap_latency + vcap_empty_time)/vcap_write_period;
|
|
// If the number of levels filled exceeds the fifo depth, then an overflow occurred.
|
|
//
|
|
// Note that the VCAP FIFO operates differently than the CRT fifos. The VCAP
|
|
// FIFO operates as 2 8x64 FIFOs. A memory request is asserted when one of the
|
|
// FIFOs is full. The capture interface then fills the other fifo while the
|
|
// full fifo is being serviced by the sequencer. Using this method, the transfer
|
|
// to memory is always 16 QWORDs for VCAP data (except special end of line conditions).
|
|
//
|
|
// Now check fifo 1. If capture was enabled then the latency for fifo 1 is:
|
|
// f1_latency = vcap_latency + vcap_empty_time +
|
|
// (BLIT_LATENCY + RAS_PRECHARGE) * mclk_period;
|
|
//
|
|
// otherwise the latency is:
|
|
// f1_latency = (BLIT_LATENCY + RAS_PRECHARGE) * mclk_period;
|
|
//
|
|
// Calculate the number of empty levels in fifo 1, i.e. the number of bytes
|
|
// that must be filled.
|
|
// f1_bytes_to_fill = ((16-threshold) * 16) + (f1_latency/f1_read_period);
|
|
// If the number of levels to be filled exceeds the fifo depth, then an underflow occurred.
|
|
// Calculate the fill time based on the effective fifo write rate.
|
|
// f1_fill_time = (f1_eff_write_period * f1_bytes_to_fill);
|
|
//
|
|
// If fifo_2 is active, calculate its latency and bytes to be filled.
|
|
// f2_latency = f1_latency + f1_fill_time +
|
|
// (RAS_PRECHARGE * mclk_period);
|
|
// f2_bytes_to_fill = ((16-threshold) * 16) + (f2_latency/f2_read_period);
|
|
// If the number of levels to be filled exceeds the fifo depth, then an underflow occurred.
|
|
// Calculate the fill time based on the effective fifo write rate.
|
|
// f2_fill_time = (f2_eff_write_period * f2_bytes_to_fill);
|
|
//
|
|
// If fifo_2 is active, calculate its latency and bytes to be filled.
|
|
// f3_latency = f2_latency + f2_fill_time +
|
|
// (RAS_PRECHARGE * mclk_period);
|
|
// f3_bytes_to_fill = ((16-threshold) * 16) + (f3_latency/f3_read_period);
|
|
// If the number of levels to be filled exceeds the fifo depth, then an underflow occurred.
|
|
// Calculate the fill time based on the effective fifo write rate.
|
|
// f3_fill_time = (f3_eff_write_period * f3_bytes_to_fill);
|
|
//
|
|
// Now go back to the start of sequence and make sure that none of the FIFOs
|
|
// have already initiated another request. The totla latency is the amount
|
|
// of time required to execute the entire sequence.
|
|
//
|
|
// Check vcap fif status if capture is enabled,
|
|
// vcap_latency = total_latency;
|
|
// vcap_bytes_to_empty = (total_latency/vcap_write_period);
|
|
//
|
|
// Check fifo 1 status
|
|
// f1_latency = (total_latency - f1_latency - f1_fill_time);
|
|
// f1_bytes_to_fill = (f1_latency/f1_read_period);
|
|
//
|
|
// Check fifo 2 status if active
|
|
// f2_latency = (total_latency - f1_latency - f1_fill_time);
|
|
// f3_bytes_to_fill = (f1_latency/f1_read_period);
|
|
//
|
|
//***************************************************************************
|
|
static BOOL Is5480SufficientBandwidth (PDEV* ppdev,
|
|
WORD wVideoDepth,
|
|
LPRECTL lpSrc,
|
|
LPRECTL lpDest,
|
|
DWORD dwFlags)
|
|
{
|
|
long lVideoPixelsPerDWORD;
|
|
long lGraphicsPixelsPerDWORD;
|
|
long lCapturePixelsPerDWORD;
|
|
long lVideoBytesPerPixel;
|
|
long lGraphicsBytesPerPixel;
|
|
long lCaptureBytesPerPixel;
|
|
long lVCLKPeriod;
|
|
long lZoom;
|
|
long lFifoAReadPeriod;
|
|
long lFifoBReadPeriod;
|
|
long lFifoCReadPeriod;
|
|
long lFifoAEffWritePeriod;
|
|
long lFifoBEffWritePeriod;
|
|
long lFifoCEffWritePeriod;
|
|
long lMemReadPeriod;
|
|
long lVPortPixelPeriod;
|
|
long lVCapReadPeriod;
|
|
long lVCapWritePeriod;
|
|
long lFifo1ReadPeriod;
|
|
long lFifo2ReadPeriod;
|
|
long lFifo3ReadPeriod;
|
|
long lFifo1EffWritePeriod;
|
|
long lFifo2EffWritePeriod;
|
|
long lFifo3EffWritePeriod;
|
|
long lVCapLatency;
|
|
long lVCapBytesToEmpty;
|
|
long lVCapEmptyTime;
|
|
long lVCapLevelRemaining;
|
|
long lFifo1Latency;
|
|
long lFifo1BytesToFill;
|
|
long lFifo1FillTime;
|
|
long lFifo2Latency;
|
|
long lFifo2BytesToFill;
|
|
long lFifo2FillTime;
|
|
long lFifo3Latency;
|
|
long lFifo3BytesToFill;
|
|
long lFifo3FillTime;
|
|
long lThreshold;
|
|
int CrtFifoCount;
|
|
BOOL bCapture;
|
|
BOOL bFifoAEnable;
|
|
BOOL bFifoBEnable;
|
|
BOOL bFifoCEnable;
|
|
BOOL bModePass;
|
|
long lHorizDecimate;
|
|
long lVPortDecimate;
|
|
long lTotalLatency;
|
|
long lVCLK;
|
|
UCHAR tempB ;
|
|
BYTE* pjPorts = ppdev->pjPorts ;
|
|
|
|
#define CAP_FIFO_DEPTH 64
|
|
#define RAS_PRECHARGE 7
|
|
#define BLIT_LATENCY 9
|
|
|
|
//
|
|
// Parameter checking
|
|
//
|
|
lFifo2EffWritePeriod = 0;
|
|
lFifo3EffWritePeriod = 0;
|
|
lHorizDecimate = 1;
|
|
lVPortDecimate = 1;
|
|
|
|
//
|
|
// Convert input parameters
|
|
//
|
|
if (wVideoDepth == 16)
|
|
{
|
|
lVideoPixelsPerDWORD = 2;
|
|
lCapturePixelsPerDWORD = 2;
|
|
}
|
|
else if (wVideoDepth == 8)
|
|
{
|
|
lVideoPixelsPerDWORD = 4;
|
|
lCapturePixelsPerDWORD = 4;
|
|
}
|
|
else return (FALSE);
|
|
|
|
if (ppdev->cBitsPerPixel == 8)
|
|
{
|
|
lGraphicsPixelsPerDWORD = 4;
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 16)
|
|
{
|
|
lGraphicsPixelsPerDWORD = 2;
|
|
}
|
|
else if (ppdev->cBitsPerPixel == 24)
|
|
{
|
|
lGraphicsPixelsPerDWORD = 1;
|
|
}
|
|
else return (FALSE);
|
|
|
|
|
|
lGraphicsBytesPerPixel = 4 / lGraphicsPixelsPerDWORD;
|
|
lVideoBytesPerPixel = 4 / lVideoPixelsPerDWORD;
|
|
lCaptureBytesPerPixel = 4 / lCapturePixelsPerDWORD;
|
|
|
|
lZoom = (lpDest->right - lpDest->left) /
|
|
(lpSrc->right - lpSrc->left);
|
|
|
|
if (lZoom < 1)
|
|
lZoom = 1;
|
|
|
|
//
|
|
// We need to get the VCLK every time since this can change at run-time
|
|
//
|
|
lVCLK = GetVCLK(ppdev);
|
|
lVCLKPeriod = (long) ((1024000000l/lVCLK) + 1);
|
|
|
|
//
|
|
// Video port at 13.5 MHz
|
|
//
|
|
lVPortPixelPeriod = (long) ((10240000) / 135);
|
|
|
|
|
|
//
|
|
// Graphics CRT FIFO read rate
|
|
//
|
|
lFifoAReadPeriod = lGraphicsBytesPerPixel * lVCLKPeriod;
|
|
|
|
//
|
|
// Video FIFO read rate
|
|
//
|
|
if(dwFlags & OVERLAY_FLG_YUVPLANAR)
|
|
{
|
|
lFifoBReadPeriod = ((lVCLKPeriod * 4) * lZoom) / lHorizDecimate;
|
|
lFifoCReadPeriod = ((lVCLKPeriod * 4) * lZoom) / lHorizDecimate;
|
|
}
|
|
else
|
|
{
|
|
lFifoBReadPeriod = ((lVCLKPeriod / lVideoBytesPerPixel) * lZoom)
|
|
/ lHorizDecimate;
|
|
lFifoCReadPeriod = lVCLKPeriod / lVideoBytesPerPixel;
|
|
}
|
|
|
|
|
|
DISPDBG ((2, "lFifoAReadPeriod = %ld, lFifoBReadPeriod=%ld\n",
|
|
lFifoAReadPeriod, lFifoBReadPeriod));
|
|
|
|
DISPDBG ((2, "lFifoCReadPeriod = %ld\n", lFifoCReadPeriod));
|
|
|
|
//
|
|
// Video capture write period
|
|
//
|
|
lVCapWritePeriod = (lVPortPixelPeriod / lCaptureBytesPerPixel)
|
|
* lVPortDecimate;
|
|
|
|
if (!ppdev->lBusWidth)
|
|
{
|
|
//
|
|
// We will read the bus width from SR0F[4:3]
|
|
//
|
|
CP_OUT_BYTE (pjPorts, SR_INDEX, 0x0F) ;
|
|
|
|
if ((CP_IN_BYTE(pjPorts, SR_DATA) & 0x18) == 0x18)
|
|
ppdev->lBusWidth = 8; // 64 bit bus
|
|
else
|
|
ppdev->lBusWidth = 4; // 32 bit bus
|
|
}
|
|
|
|
if (!ppdev->lMCLKPeriod)
|
|
{
|
|
LONG lMCLK;
|
|
|
|
//
|
|
// The MCLK period is the amount of time required for one cycle.
|
|
// We will round up.
|
|
//
|
|
CP_OUT_BYTE (pjPorts, SR_INDEX, 0x1F) ; // First get the MCLK frequency
|
|
lMCLK = CP_IN_BYTE(pjPorts, SR_DATA);
|
|
lMCLK *= 14318;
|
|
lMCLK >>= 3;
|
|
ppdev->lMCLKPeriod = (long) ((1024000000l/lMCLK) + 1);
|
|
}
|
|
|
|
//
|
|
// Calculate CRT effective read and write periods
|
|
//
|
|
lMemReadPeriod = ppdev->lMCLKPeriod / ppdev->lBusWidth;
|
|
|
|
if (lFifoAReadPeriod == lMemReadPeriod)
|
|
lFifoAEffWritePeriod = 1000000000;
|
|
else
|
|
lFifoAEffWritePeriod = (lMemReadPeriod * lFifoAReadPeriod) /
|
|
(lFifoAReadPeriod - lMemReadPeriod);
|
|
|
|
if (lFifoBReadPeriod == lMemReadPeriod)
|
|
lFifoBEffWritePeriod = 1000000000;
|
|
else
|
|
lFifoBEffWritePeriod = (lMemReadPeriod * lFifoBReadPeriod) /
|
|
(lFifoBReadPeriod - lMemReadPeriod);
|
|
|
|
if (lFifoCReadPeriod == lMemReadPeriod)
|
|
lFifoCEffWritePeriod = 1000000000;
|
|
else
|
|
lFifoCEffWritePeriod = (lMemReadPeriod * lFifoCReadPeriod) /
|
|
(lFifoCReadPeriod - lMemReadPeriod);
|
|
|
|
//
|
|
// Video capture read period
|
|
//
|
|
lVCapReadPeriod = (2 * ppdev->lMCLKPeriod) / ppdev->lBusWidth;
|
|
|
|
|
|
if (dwFlags & OVERLAY_FLG_CAPTURE) // is capture enable ?
|
|
bCapture = TRUE;
|
|
else
|
|
bCapture = FALSE;
|
|
|
|
|
|
if (dwFlags & OVERLAY_FLG_YUVPLANAR) // is 420 format
|
|
{
|
|
if (dwFlags & (OVERLAY_FLG_COLOR_KEY | OVERLAY_FLG_SRC_COLOR_KEY)) // occlusion
|
|
{ // one video window, occlusion, 420 format
|
|
bFifoAEnable = TRUE;
|
|
bFifoBEnable = TRUE;
|
|
bFifoCEnable = TRUE;
|
|
}
|
|
else
|
|
{ // one video window, no occlusion, 420 format
|
|
bFifoAEnable = FALSE;
|
|
bFifoBEnable = TRUE;
|
|
bFifoCEnable = TRUE;
|
|
}
|
|
}
|
|
else // not 420 format
|
|
{
|
|
if (dwFlags & (OVERLAY_FLG_COLOR_KEY | OVERLAY_FLG_SRC_COLOR_KEY)) // occlusion
|
|
{
|
|
if (dwFlags & OVERLAY_FLG_TWO_VIDEO)
|
|
{ // Two video windows, occlusion, not 420 format
|
|
bFifoAEnable = TRUE;
|
|
bFifoBEnable = TRUE;
|
|
bFifoCEnable = TRUE;
|
|
}
|
|
else
|
|
{ // one video window, occlusion, not 420 format
|
|
bFifoAEnable = TRUE;
|
|
bFifoBEnable = TRUE;
|
|
bFifoCEnable = FALSE;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// one video window, no occlusion, not 420 format
|
|
bFifoAEnable = FALSE;
|
|
bFifoBEnable = TRUE;
|
|
bFifoCEnable = FALSE;
|
|
}
|
|
}
|
|
|
|
DISPDBG ((4, " FIFOA = %s, FIFOB= %s, FIFOC = %s\n",
|
|
bFifoAEnable ? "yes" : "no",
|
|
bFifoBEnable ? "yes" : "no",
|
|
bFifoCEnable ? "yes" : "no"));
|
|
|
|
lFifo1ReadPeriod = 0;
|
|
lFifo2ReadPeriod = 0;
|
|
lFifo3ReadPeriod = 0;
|
|
|
|
if (bFifoAEnable)
|
|
{
|
|
if (((lFifoAReadPeriod >= lFifoBReadPeriod) || !bFifoBEnable) &&
|
|
// A slower than or equal than B) and
|
|
((lFifoAReadPeriod >= lFifoCReadPeriod) || !bFifoCEnable))
|
|
// A slower than or equal C
|
|
{
|
|
lFifo1ReadPeriod = lFifoAReadPeriod;
|
|
lFifo1EffWritePeriod = lFifoAEffWritePeriod;
|
|
}
|
|
else if (((lFifoAReadPeriod >= lFifoBReadPeriod) || !bFifoBEnable) ||
|
|
// A slower than or equal B
|
|
((lFifoAReadPeriod >= lFifoCReadPeriod) || !bFifoCEnable))
|
|
// A slower than or equal C
|
|
{
|
|
lFifo2ReadPeriod = lFifoAReadPeriod;
|
|
lFifo2EffWritePeriod = lFifoAEffWritePeriod;
|
|
}
|
|
else // A not slower than A or B
|
|
{
|
|
lFifo3ReadPeriod = lFifoAReadPeriod;
|
|
lFifo3EffWritePeriod = lFifoAEffWritePeriod;
|
|
}
|
|
}
|
|
|
|
DISPDBG ((2, "After bFifoAEnable")) ;
|
|
DISPDBG ((2, "lFifo1ReadPeriod = %ld, lFifo2ReadPeriod=%ld",
|
|
lFifo1ReadPeriod, lFifo2ReadPeriod)) ;
|
|
DISPDBG ((2, "lFifo3ReadPeriod = %ld", lFifo3ReadPeriod)) ;
|
|
|
|
|
|
if (bFifoBEnable)
|
|
{
|
|
if (((lFifoBReadPeriod > lFifoAReadPeriod) || !bFifoAEnable) &&
|
|
// B slower than A and
|
|
((lFifoBReadPeriod >= lFifoCReadPeriod) || !bFifoCEnable))
|
|
// slower than or equal A
|
|
{
|
|
lFifo1ReadPeriod = lFifoBReadPeriod;
|
|
lFifo1EffWritePeriod = lFifoBEffWritePeriod;
|
|
}
|
|
else if (((lFifoBReadPeriod > lFifoAReadPeriod) || !bFifoAEnable) ||
|
|
// B slower than A or
|
|
((lFifoBReadPeriod >= lFifoCReadPeriod) || !bFifoCEnable))
|
|
// B slower than or equal C
|
|
{
|
|
|
|
lFifo2ReadPeriod = lFifoBReadPeriod;
|
|
lFifo2EffWritePeriod = lFifoBEffWritePeriod;
|
|
|
|
}
|
|
else
|
|
// (B not slower than A ) and (B not slower than or equal C)
|
|
{
|
|
lFifo3ReadPeriod = lFifoBReadPeriod;
|
|
lFifo3EffWritePeriod = lFifoBEffWritePeriod;
|
|
}
|
|
}
|
|
else
|
|
|
|
|
|
|
|
DISPDBG ((4, "After bFifoBEnable")) ;
|
|
DISPDBG ((4, "lFifo1ReadPeriod = %ld, lFifo2ReadPeriod=%ld",
|
|
lFifo1ReadPeriod, lFifo2ReadPeriod)) ;
|
|
DISPDBG ((4, "lFifo3ReadPeriod = %ld", lFifo3ReadPeriod)) ;
|
|
|
|
if (bFifoCEnable)
|
|
{
|
|
if (((lFifoCReadPeriod > lFifoAReadPeriod) || !bFifoAEnable) &&
|
|
// C slower than A and
|
|
((lFifoCReadPeriod > lFifoBReadPeriod) || !bFifoBEnable))
|
|
// C slower than B
|
|
{
|
|
lFifo1ReadPeriod = lFifoCReadPeriod;
|
|
lFifo1EffWritePeriod = lFifoCEffWritePeriod;
|
|
}
|
|
else if (((lFifoCReadPeriod > lFifoAReadPeriod) || !bFifoAEnable) ||
|
|
// C slower than A or
|
|
((lFifoCReadPeriod > lFifoBReadPeriod) || !bFifoBEnable))
|
|
// C slower than B
|
|
{
|
|
lFifo2ReadPeriod = lFifoCReadPeriod;
|
|
lFifo2EffWritePeriod = lFifoCEffWritePeriod;
|
|
}
|
|
else
|
|
{
|
|
// C not slower than A and C not slower than B
|
|
lFifo3ReadPeriod = lFifoCReadPeriod;
|
|
lFifo3EffWritePeriod = lFifoCEffWritePeriod;
|
|
}
|
|
}
|
|
|
|
DISPDBG ((4, "After bFifoCEnable")) ;
|
|
DISPDBG ((4, "lFifo1ReadPeriod = %ld, lFifo2ReadPeriod=%ld",
|
|
lFifo1ReadPeriod, lFifo2ReadPeriod)) ;
|
|
DISPDBG ((4, "lFifo3ReadPeriod = %ld", lFifo3ReadPeriod)) ;
|
|
DISPDBG ((4, "lFifo1EffWritePeriod = %ld, lFifo2EffWritePeriod = %ld",
|
|
lFifo1EffWritePeriod, lFifo2EffWritePeriod)) ;
|
|
DISPDBG ((4, " lFifo3EffWritePeriod = %ld", lFifo3EffWritePeriod)) ;
|
|
DISPDBG ((4, " lFifoAEffWritePeriod = %ld, lFifoBEffWritePeriod = %ld",
|
|
lFifoAEffWritePeriod, lFifoBEffWritePeriod)) ;
|
|
DISPDBG ((4, " lFifoCEffWritePeriod = %ld", lFifoCEffWritePeriod)) ;
|
|
|
|
bModePass = FALSE;
|
|
lThreshold = 1;
|
|
|
|
CrtFifoCount = 0;
|
|
if (bFifoAEnable) CrtFifoCount++;
|
|
if (bFifoBEnable) CrtFifoCount++;
|
|
if (bFifoCEnable) CrtFifoCount++;
|
|
|
|
while ((!bModePass) && (lThreshold < 16))
|
|
{
|
|
bModePass = TRUE; // assume pass until proven otherwise.
|
|
|
|
//
|
|
// Checking capture
|
|
//
|
|
if (bCapture)
|
|
{
|
|
lVCapLatency = (BLIT_LATENCY + RAS_PRECHARGE) * ppdev->lMCLKPeriod;
|
|
lVCapBytesToEmpty = CAP_FIFO_DEPTH;
|
|
lVCapEmptyTime = lVCapReadPeriod * lVCapBytesToEmpty;
|
|
lVCapLevelRemaining = (lVCapLatency + lVCapEmptyTime) / lVCapWritePeriod;
|
|
if (lVCapLevelRemaining > CAP_FIFO_DEPTH)
|
|
return(FALSE);
|
|
}
|
|
|
|
//
|
|
// Fill FIFO 1
|
|
//
|
|
if (bCapture)
|
|
lFifo1Latency = lVCapLatency + lVCapEmptyTime + (BLIT_LATENCY + RAS_PRECHARGE) * ppdev->lMCLKPeriod;
|
|
else
|
|
lFifo1Latency = (BLIT_LATENCY + RAS_PRECHARGE) * ppdev->lMCLKPeriod;
|
|
|
|
lFifo1BytesToFill = ((16 - lThreshold) * 16)
|
|
+ (lFifo1Latency / lFifo1ReadPeriod);
|
|
lFifo1FillTime = lFifo1EffWritePeriod * lFifo1BytesToFill;
|
|
if (lFifo1BytesToFill > 256)
|
|
bModePass = FALSE;
|
|
|
|
DISPDBG ((4, "After Fill FIFO1, lFifo1BytesToFillb=%ld, ModePass = %s",
|
|
lFifo1BytesToFill, bModePass ? "yes" : "no")) ;
|
|
DISPDBG ((4, "f1_latency=%ld, f1_read_period=%ld",
|
|
lFifo1Latency, lFifo1ReadPeriod)) ;
|
|
DISPDBG ((4, "mclkperiod= %ld, vclkperiod=%ld",
|
|
ppdev->lMCLKPeriod, lVCLKPeriod)) ;
|
|
|
|
//
|
|
// Fill FIFO 2
|
|
//
|
|
if (CrtFifoCount > 1)
|
|
{
|
|
lFifo2Latency = lFifo1Latency + lFifo1FillTime +
|
|
(RAS_PRECHARGE * ppdev->lMCLKPeriod);
|
|
lFifo2BytesToFill = ((16 - lThreshold) * 16) +
|
|
(lFifo2Latency / lFifo2ReadPeriod);
|
|
lFifo2FillTime = lFifo2EffWritePeriod * lFifo2BytesToFill;
|
|
if (lFifo2BytesToFill > 256)
|
|
bModePass = FALSE;
|
|
}
|
|
else
|
|
{
|
|
lFifo2Latency = lFifo1Latency + lFifo1FillTime;
|
|
lFifo2BytesToFill = 0;
|
|
lFifo2FillTime = 0;
|
|
}
|
|
|
|
DISPDBG ((4, "After Fill FIFO2, lFifo2BytesToFill=%ld, ModePass = %s",
|
|
lFifo2BytesToFill, bModePass ? "yes" : "no"));
|
|
|
|
//
|
|
// Fill FIFO 3
|
|
//
|
|
if (CrtFifoCount > 2)
|
|
{
|
|
lFifo3Latency = lFifo2Latency + lFifo2FillTime + (RAS_PRECHARGE * ppdev->lMCLKPeriod);
|
|
lFifo3BytesToFill = ((16 - lThreshold) * 16) + (lFifo3Latency / lFifo3ReadPeriod);
|
|
lFifo3FillTime = lFifo3EffWritePeriod * lFifo3BytesToFill;
|
|
if (lFifo3BytesToFill > 256)
|
|
bModePass = FALSE;
|
|
}
|
|
else
|
|
{
|
|
lFifo3Latency = lFifo2Latency + lFifo2FillTime;
|
|
lFifo3BytesToFill = 0;
|
|
lFifo3FillTime = 0;
|
|
}
|
|
|
|
DISPDBG ((4, "After Fill FIFO3, lFifo3BytesToFill=%ld, ModePass = %s",
|
|
lFifo3BytesToFill, bModePass ? "yes" : "no")) ;
|
|
|
|
//
|
|
// Determine total latency through the sequence
|
|
//
|
|
lTotalLatency = lFifo3Latency + lFifo3FillTime;
|
|
|
|
//
|
|
// Now back to start of sequence, make sure that none of the FIFOs
|
|
// have already initiated another request.
|
|
//
|
|
|
|
//
|
|
// Check capture FIFO status
|
|
//
|
|
if (bCapture)
|
|
{
|
|
lVCapLatency = lTotalLatency;
|
|
lVCapBytesToEmpty = lTotalLatency / lVCapWritePeriod;
|
|
if (lVCapBytesToEmpty > CAP_FIFO_DEPTH)
|
|
bModePass = FALSE;
|
|
}
|
|
|
|
//
|
|
// Check FIFO 1 status
|
|
//
|
|
lFifo1Latency = lTotalLatency - lFifo1Latency - lFifo1FillTime;
|
|
lFifo1BytesToFill = lFifo1Latency / lFifo1ReadPeriod;
|
|
if (lFifo1BytesToFill > ((16 - lThreshold) * 16))
|
|
bModePass = FALSE;
|
|
|
|
DISPDBG ((4, "After CheckF FIFO1, fifo1bytestofill %ld,bModePass = %s",
|
|
lFifo1BytesToFill, bModePass ? "yes" : "no")) ;
|
|
|
|
//
|
|
// Check FIFO 2 status
|
|
//
|
|
if (CrtFifoCount > 1)
|
|
{
|
|
lFifo2Latency = lTotalLatency - lFifo2Latency - lFifo2FillTime;
|
|
lFifo2BytesToFill = lFifo2Latency / lFifo2ReadPeriod;
|
|
if (lFifo2BytesToFill > ((16 - lThreshold) * 16))
|
|
bModePass = FALSE;
|
|
|
|
DISPDBG ((4, "After Check FIFO 2, fifo1bytestofill=%ld, bModePass = %s",
|
|
lFifo2BytesToFill, bModePass ? "yes" : "no")) ;
|
|
|
|
}
|
|
|
|
if (!bModePass)
|
|
lThreshold++;
|
|
|
|
}
|
|
|
|
|
|
if (bModePass)
|
|
{
|
|
|
|
DISPDBG ((1, "Is sufficient Bandwidth, thresh = %ld, return TRUE\n", lThreshold));
|
|
|
|
if (ppdev->cBitsPerPixel == 24)
|
|
lThreshold = 0x0F;
|
|
|
|
ppdev->lFifoThresh = lThreshold;
|
|
|
|
return TRUE ;
|
|
}
|
|
|
|
DISPDBG ((2, "Is sufficient Bandwidth, thresh = %ld, rerurn FALSE", lThreshold));
|
|
return FALSE;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: GetVCLK
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* Returns the VCLK frequency * 1000.
|
|
*
|
|
* Input Parameters:
|
|
* -----------------
|
|
* none
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
* MCLK
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 09/25/96
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
|
|
LONG GetVCLK(PDEV* ppdev)
|
|
{
|
|
LONG lTemp;
|
|
LONG lRegSR1F;
|
|
LONG lRegMISC;
|
|
LONG lNR;
|
|
LONG lDR;
|
|
LONG lPS;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
/*
|
|
* First read SR1F. This tells us if VCLK is derived from MCLK
|
|
* or if it's derived normally.
|
|
*/
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, 0x1f);
|
|
lRegSR1F = (LONG) CP_IN_BYTE(pjPorts, SR_DATA);
|
|
if (lRegSR1F & 0x40)
|
|
{
|
|
LONG lMCLK;
|
|
|
|
/*
|
|
* It is derived from MCLK, but now we need to read SR1E to see
|
|
* if VCLK = MCLK or if VCLK = MCLK/2.
|
|
*/
|
|
lMCLK = (lRegSR1F & 0x3F) * 14318;
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, 0x1e);
|
|
if (CP_IN_BYTE(pjPorts, SR_DATA) & 0x01)
|
|
{
|
|
return (lMCLK >> 4);
|
|
}
|
|
else
|
|
{
|
|
return (lMCLK >> 3);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* Read MISC[3:2], which tells us where to find our VCLK
|
|
*/
|
|
lRegMISC = (LONG) CP_IN_BYTE(pjPorts, 0x3cc);
|
|
lRegMISC >>= 2;
|
|
|
|
//myf33 begin
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, (BYTE)0x80);
|
|
if (((ppdev->ulChipID == CL7555_ID) || (ppdev->ulChipID == CL7556_ID)) &&
|
|
(CP_IN_BYTE(pjPorts, CRTC_DATA) & 0x01))
|
|
lRegMISC &= 0x02; // Fixed PDR 8709
|
|
else
|
|
//myf33 end
|
|
lRegMISC &= 0x03;
|
|
|
|
lNR = 0x0B + lRegMISC;
|
|
lDR = 0x1B + lRegMISC;
|
|
|
|
/*
|
|
* Read the values for bP, bDR, and bNR
|
|
*/
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, (BYTE) lDR);
|
|
lPS = lDR = (LONG)CP_IN_BYTE(pjPorts, SR_DATA);
|
|
CP_OUT_BYTE(pjPorts, SR_INDEX, (BYTE) lNR);
|
|
lNR = (LONG)CP_IN_BYTE(pjPorts, SR_DATA);
|
|
lPS &= 0x01;
|
|
lPS += 1;
|
|
lDR >>= 1;
|
|
//
|
|
// Extended the VCLK bits.
|
|
//
|
|
// sge06
|
|
lDR &= 0x7f;
|
|
lNR &= 0x7f;
|
|
|
|
/*
|
|
* VCLK = (14.31818 * bNR) / (bDR * bPS)
|
|
*/
|
|
lTemp = (14318 * lNR);
|
|
if (!lPS || !lDR)
|
|
{
|
|
return (0);
|
|
}
|
|
lTemp /= (lDR * lPS);
|
|
}
|
|
|
|
return (lTemp);
|
|
}
|
|
/**********************************************************
|
|
*
|
|
* Name: EnableStartAddrDoubleBuffer
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* Enable the double buffering of the start addresses. This allows the page
|
|
* flipping operation to proceed without the system CPU waiting for VRT.
|
|
*
|
|
* Input Parameters:
|
|
* -----------------
|
|
* none
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 10/01/96
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
VOID EnableStartAddrDoubleBuffer(PDEV* ppdev)
|
|
{
|
|
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
BYTE cTemp;
|
|
|
|
|
|
CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a);
|
|
cTemp = CP_IN_BYTE(pjPorts, CRTC_DATA);
|
|
CP_OUT_BYTE(pjPorts, CRTC_DATA, cTemp | 2);
|
|
}
|
|
|
|
/**********************************************************
|
|
*
|
|
* Name: GetCurrentVLine
|
|
*
|
|
* Module Abstract:
|
|
* ----------------
|
|
* Get the current scan line
|
|
*
|
|
* Input Parameters:
|
|
* -----------------
|
|
* none
|
|
*
|
|
* Output Parameters:
|
|
* ------------------
|
|
*
|
|
***********************************************************
|
|
* Author: Shuhua Ge
|
|
* Date: 10/01/96
|
|
*
|
|
* Revision History:
|
|
* -----------------
|
|
* WHO WHEN WHAT/WHY/HOW
|
|
* --- ---- ------------
|
|
*
|
|
*********************************************************/
|
|
DWORD GetCurrentVLine(PDEV* ppdev)
|
|
{
|
|
|
|
DWORD dwLine;
|
|
BYTE cTemp;
|
|
BYTE* pjPorts = ppdev->pjPorts;
|
|
|
|
CP_OUT_BYTE(pjPorts, INDEX_REG, 0x16); /* Index to the low byte. */
|
|
dwLine = (ULONG)CP_IN_BYTE(pjPorts, DATA_REG);
|
|
|
|
CP_OUT_BYTE(pjPorts, INDEX_REG, 0x17); /* Index to the high bits. */
|
|
cTemp = CP_IN_BYTE(pjPorts, DATA_REG);
|
|
dwLine |= (cTemp & 3) << 8;
|
|
|
|
CP_OUT_BYTE(pjPorts, INDEX_REG, 0x16); /* Index to the low byte. */
|
|
|
|
/* If we wrapped around while getting the high bits we have a problem. */
|
|
/* The high bits may be wrong. */
|
|
if((CP_IN_BYTE(pjPorts, DATA_REG)) < (dwLine & 0xff))
|
|
{
|
|
DISPDBG((1, "Recursive call to GetCurrentVLine."));
|
|
return GetCurrentVLine(ppdev);
|
|
}
|
|
if (dwLine > ppdev->dwVsyncLine)
|
|
{
|
|
return 0;
|
|
}
|
|
return dwLine;
|
|
}
|
|
#endif
|
|
|
|
#endif // DIRECTDRAW
|