/******************************************************************************\ * * Copyright (c) 1996-1997 Microsoft Corporation. * Copyright (c) 1996-1997 Cirrus Logic, Inc. * * Module Name: * * D D R A W . C * * * Implements all the DirectDraw components for the driver. * * * $Log: S:/projects/drivers/ntsrc/display/ddraw.c_v $ * * Rev 1.14 07 Apr 1997 11:37:02 PLCHU * * * Rev 1.13 Apr 03 1997 15:38:44 unknown * * * * Rev 1.10 Jan 14 1997 15:15:12 unknown * Add new double clock detecting method. * * Rev 1.8 Jan 08 1997 11:23:34 unknown * Add 2x clock support and double scan line counter support * * Rev 1.7 Dec 17 1996 18:31:12 unknown * Update the bandwidth equation again. * * Rev 1.6 Dec 13 1996 12:15:04 unknown * update bandwith equation. * * Rev 1.5 Dec 12 1996 11:09:52 unknown * Add double scan line counter support * * Rev 1.5 Dec 12 1996 11:02:12 unknown * Add double scan line counter support. * * Rev 1.5 Nov 26 1996 14:29:58 unknown * Turn off the video window before the moving and then turn it on. * * Rev 1.4 Nov 25 1996 14:39:32 unknown * Fixed AVI file playback and 16bpp transparent Blt bugs. * * Rev 1.4 Nov 18 1996 13:58:58 JACKIEC * * * Rev 1.3 Nov 07 1996 16:47:56 unknown * * * Rev 1.2 Oct 16 1996 14:41:04 unknown * NT 3.51 does not have DDRAW support, So turn off overlay.h in NT 3.51 * * Rev 1.1 Oct 10 1996 15:36:28 unknown * * * Rev 1.10 12 Aug 1996 16:51:04 frido * Added NT 3.5x/4.0 auto detection. * * Rev 1.9 06 Aug 1996 18:37:12 frido * DirectDraw works! Video mapping is the key! * * Rev 1.8 24 Jul 1996 14:38:44 frido * Cleaned up font cache after DirectDraw is done. * * Rev 1.7 24 Jul 1996 14:30:04 frido * Added a call to destroy all cached fonts to make more room. * * Rev 1.6 20 Jul 1996 00:00:44 frido * Fixed filling of DirectDraw in 24-bpp. * Changed off-screen alignment to 4 bytes. * Added compile switch to manage DirectDraw support in 24-bpp. * * Rev 1.5 16 Jul 1996 18:55:22 frido * Fixed DirectDraw in 24-bpp mode. * * Rev 1.4 15 Jul 1996 18:03:22 frido * Changed CP_MM_DST_ADDR to CP_MM_DST_ADDR_ABS. * * Rev 1.3 15 Jul 1996 10:58:28 frido * Changed back to S3 base. * * Rev 1.1 09 Jul 1996 14:52:30 frido * Only support chips 5436 and 5446. * * Rev 1.0 03 Jul 1996 13:53:02 frido * Ported from S3 DirectDraw code. * * jl01 10-08-96 Do Transparent BLT w/o Solid Fill. Refer to PDRs#5511/6817. * * chu01 11-17-96 For 24-bpp, aligned destination boundary/size values are * wrong. Refer to PDR#7312. * * sge01 11-19-96 Write CR37 at last For 5480. * * * sge02 11-21-96 We have to set the Color Expand Width even in * non-expand transparency mode. * * * sge03 12-04-96 Add double scan line counter support . * * sge04 12-13-96 Change bandwidth for 5446BE and later chips. * * sge05 01-07-97 Use dword align for double clock mode. * * chu02 01-08-97 Disable ActiveX/Active Movie Player for interlaced modes. * Refer to PDR#7312, 7866. * * jc01 10-18-96 Port Microsoft recent change. * tao1 10-21-96 Added direct draw support for CL-GD7555. * myf21 11-21-96 Change CAPS_IS_7555 to check ppdev->ulChipID * * sge06 01-27-97 Extend VCLK Denominator to 7 bits from 5 bits. * sge07 02-13-97 Use replication when in 1280x1024x8 mode. * myf31 02-24-97 Fixed enable HW Video, panning scrolling enable,screen move * video window have follow moving * chu03 03-26-97 Bandwidth eqution for the CL-GD5480. * myf33 :03-31-97 : Fixed PDR #8709, read true VCLK in getVCLK() * & panning scrolling enable, support HW Video * chu04 04-02-97 No matterwhat color depth is, always turn on COLORKEY and * SRCBLT in the DD/DD colorkey capabilities for the 5480. * \******************************************************************************/ #include "PreComp.h" #if DIRECTDRAW #include "overlay.h" LONG MIN_OLAY_WIDTH = 4; //#define ONLY54x6 // Comment this line out if DirectDraw should be 'generic' // The next flag controls DirectDraw support in 24-bpp. #define DIRECTX_24 2 // 0 - no support // 1 - blt support, no heap (flip) // 2 - full support // // Some handy macros. // #define BLT_BUSY(ppdev, pjBase) (CP_MM_ACL_STAT(ppdev, pjBase) & 0x01) #ifdef ONLY54x6 #define BLT_READY(ppdev, pjBase) (!(CP_MM_ACL_STAT(ppdev, pjBase) & 0x10)) #else #define BLT_READY(ppdev, pjBase) (!(CP_MM_ACL_STAT(ppdev, pjBase) & \ ((ppdev->flCaps & CAPS_AUTOSTART) ? 0x10 : 0x01))) #endif #define NUM_VBLANKS_TO_MEASURE 1 #define NUM_MEASUREMENTS_TO_TAKE 8 /******************************Public*Routine******************************\ * * DWORD dwGetPaletteEntry * \**************************************************************************/ DWORD dwGetPaletteEntry( PDEV* ppdev, DWORD iIndex) { BYTE* pjPorts; DWORD dwRed; DWORD dwGreen; DWORD dwBlue; pjPorts = ppdev->pjPorts; CP_OUT_BYTE(pjPorts, DAC_PEL_READ_ADDR, iIndex); dwRed = CP_IN_BYTE(pjPorts, DAC_PEL_DATA); dwGreen = CP_IN_BYTE(pjPorts, DAC_PEL_DATA); dwBlue = CP_IN_BYTE(pjPorts, DAC_PEL_DATA); return((dwRed << 16) | (dwGreen << 8) | (dwBlue)); } /******************************Public*Routine******************************\ * VOID vGetDisplayDuration * * Get the length, in EngQueryPerformanceCounter() ticks, of a refresh cycle. * * If we could trust the miniport to return back and accurate value for * the refresh rate, we could use that. Unfortunately, our miniport doesn't * ensure that it's an accurate value. * \**************************************************************************/ VOID vGetDisplayDuration( PDEV* ppdev) { BYTE* pjPorts; DWORD dwTemp; LONG i, j; LONGLONG li; LONGLONG liMin; LONGLONG aliMeasurement[NUM_MEASUREMENTS_TO_TAKE + 1]; pjPorts = ppdev->pjPorts; memset(&ppdev->flipRecord, 0, sizeof(ppdev->flipRecord)); // Warm up EngQUeryPerformanceCounter to make sure it's in the working set. EngQueryPerformanceCounter(&li); // Unfortunately, since NT is a proper multitasking system, we can't just // disable interrupts to take an accurate reading. We also can't do anything // so goofy as dynamically change our thread's priority to real-time. // // So we just do a bunch of short measurements and take the minimum. // // It would be 'okay' if we got a result that's longer than the actual // VBlank cycle time -- nothing bad would happen except that the app would // run a little slower. We don't want to get a result that's shorter than // the actual VBlank cycle time -- that could cause us to start drawing over // a frame before the Flip has occured. while (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE) ; while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)) ; for (i = 0; i < NUM_MEASUREMENTS_TO_TAKE; i++) { // We're at the start of the VBlank active cycle! EngQueryPerformanceCounter(&aliMeasurement[i]); // Okay, so life in a multi-tasking environment isn't all that simple. // What if we had taken a context switch just before the above // EngQueryPerformanceCounter call, and now were half way through the // VBlank inactive cycle? Then we would measure only half a VBlank // cycle, which is obviously bad. The worst thing we can do is get a // time shorter than the actual VBlank cycle time. // // So we solve this by making sure we're in the VBlank active time // before and after we query the time. If it's not, we'll sync up to the // next VBlank (it's okay to measure this period -- it will be // guaranteed to be longer than the VBlank cycle and will likely be // thrown out when we select the minimum sample). There's a chance that // we'll take a context switch and return just before the end of the // active VBlank time -- meaning that the actual measured time would be // less than the true amount -- but since the VBlank is active less than // 1% of the time, this means that we would have a maximum of 1% error // approximately 1% of the times we take a context switch. An acceptable // risk. // // This next line will cause us wait if we're no longer in the VBlank // active cycle as we should be at this point. while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)) ; for (j = 0; j < NUM_VBLANKS_TO_MEASURE; j++) { while (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE) ; while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)) ; } } EngQueryPerformanceCounter(&aliMeasurement[NUM_MEASUREMENTS_TO_TAKE]); // Use the minimum. liMin = aliMeasurement[1] - aliMeasurement[0]; DISPDBG((2, "Refresh count: %li - %li", 1, (ULONG) liMin)); for (i = 2; i <= NUM_MEASUREMENTS_TO_TAKE; i++) { li = aliMeasurement[i] - aliMeasurement[i - 1]; DISPDBG((2, " %li - %li", i, (ULONG) li)); if (li < liMin) { liMin = li; } } // Round the result: ppdev->flipRecord.liFlipDuration = (DWORD) (liMin + (NUM_VBLANKS_TO_MEASURE / 2)) / NUM_VBLANKS_TO_MEASURE; DISPDBG((2, "Frequency %li.%03li Hz", (ULONG) (EngQueryPerformanceFrequency(&li), li / ppdev->flipRecord.liFlipDuration), (ULONG) (EngQueryPerformanceFrequency(&li), ((li * 1000) / ppdev->flipRecord.liFlipDuration) % 1000))); ppdev->flipRecord.liFlipTime = aliMeasurement[NUM_MEASUREMENTS_TO_TAKE]; ppdev->flipRecord.bFlipFlag = FALSE; ppdev->flipRecord.fpFlipFrom = 0; // sge // Get the line on which the VSYNC occurs CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x7); dwTemp = (DWORD)CP_IN_BYTE(pjPorts, CRTC_DATA); ppdev->dwVsyncLine = ((dwTemp & 0x80) << 2); ppdev->dwVsyncLine |= ((dwTemp & 0x04) << 6); CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x10); ppdev->dwVsyncLine |= CP_IN_BYTE(pjPorts, CRTC_DATA); } /******************************Public*Routine******************************\ * HRESULT dwUpdateFlipStatus * * Checks and sees if the most recent flip has occurred. * \**************************************************************************/ HRESULT UpdateFlipStatus(PDEV* ppdev, FLATPTR fpVidMem) { BYTE* pjPorts; LONGLONG liTime; pjPorts = ppdev->pjPorts; if ((ppdev->flipRecord.bFlipFlag) && //#jc01 ((fpVidMem == 0) || (fpVidMem == ppdev->flipRecord.fpFlipFrom))) ((fpVidMem == 0xffffffff) || (fpVidMem == ppdev->flipRecord.fpFlipFrom))) //#jc01 { #if 0 // sge use scanline if (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE) { if (ppdev->flipRecord.bWasEverInDisplay) { ppdev->flipRecord.bHaveEverCrossedVBlank = TRUE; } } else if (!(CP_IN_BYTE(pjPorts, STATUS_1) & DISPLAY_MODE_INACTIVE)) { if( ppdev->flipRecord.bHaveEverCrossedVBlank ) { ppdev->flipRecord.bFlipFlag = FALSE; return(DD_OK); } ppdev->flipRecord.bWasEverInDisplay = TRUE; } EngQueryPerformanceCounter(&liTime); if (liTime - ppdev->flipRecord.liFlipTime <= ppdev->flipRecord.liFlipDuration) { return(DDERR_WASSTILLDRAWING); } #else /* * if we aren't in the vertical retrace, we can use the scanline * to help decide on what to do */ if( !(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE) ) { if( ppdev->flipRecord.bHaveEverCrossedVBlank == FALSE ) { ppdev->flipRecord.bWasEverInDisplay = TRUE; if( GetCurrentVLine(ppdev) >= ppdev->flipRecord.dwFlipScanLine ) { EngQueryPerformanceCounter(&liTime); if (liTime - ppdev->flipRecord.liFlipTime <= ppdev->flipRecord.liFlipDuration) { return(DDERR_WASSTILLDRAWING); } } } } /* * in the vertical retrace, scanline is useless */ else { if( ppdev->flipRecord.bWasEverInDisplay ) { ppdev->flipRecord.bHaveEverCrossedVBlank = TRUE; // return DD_OK; } EngQueryPerformanceCounter(&liTime); if (liTime - ppdev->flipRecord.liFlipTime <= ppdev->flipRecord.liFlipDuration) { return(DDERR_WASSTILLDRAWING); } } #endif // endif use scanline ppdev->flipRecord.bFlipFlag = FALSE; } return(DD_OK); } /******************************Public*Routine******************************\ * DWORD DdBlt * \**************************************************************************/ DWORD DdBlt( PDD_BLTDATA lpBlt) { PDD_SURFACE_GLOBAL srcSurf; PDD_SURFACE_GLOBAL dstSurf; PDEV* ppdev; BYTE* pjBase; DWORD dstOffset; DWORD dstPitch; DWORD dstX, dstY; DWORD dwFlags; DWORD width, height; DWORD srcOffset; DWORD srcPitch; DWORD srcX, srcY; ULONG ulBltCmd; DWORD xExt, yExt; DWORD xDiff, yDiff; ppdev = lpBlt->lpDD->dhpdev; pjBase = ppdev->pjBase; dstSurf = lpBlt->lpDDDestSurface->lpGbl; // Is a flip in progress? if (UpdateFlipStatus(ppdev, dstSurf->fpVidMem) != DD_OK) { lpBlt->ddRVal = DDERR_WASSTILLDRAWING; return(DDHAL_DRIVER_HANDLED); } dwFlags = lpBlt->dwFlags; if (dwFlags & DDBLT_ASYNC) { // If async, then only work if we won't have to wait on the accelerator // to start the command. if (!BLT_READY(ppdev, pjBase)) { lpBlt->ddRVal = DDERR_WASSTILLDRAWING; return(DDHAL_DRIVER_HANDLED); } } DISPDBG((2, "DdBlt Entered")); // Calculate destination parameters. dstX = lpBlt->rDest.left; dstY = lpBlt->rDest.top; width = PELS_TO_BYTES(lpBlt->rDest.right - dstX) - 1; height = (lpBlt->rDest.bottom - dstY) - 1; dstPitch = dstSurf->lPitch; dstOffset = (DWORD)(dstSurf->fpVidMem + PELS_TO_BYTES(dstX) + (dstY * dstPitch)); // Color fill? if (dwFlags & DDBLT_COLORFILL) { ULONG ulBltMode = ENABLE_COLOR_EXPAND | ENABLE_8x8_PATTERN_COPY | ppdev->jModeColor; // Wait for the accelerator. while (!BLT_READY(ppdev, pjBase)) ; // Program bitblt engine. CP_MM_ROP(ppdev, pjBase, HW_P); CP_MM_DST_Y_OFFSET(ppdev, pjBase, dstPitch); CP_MM_BLT_MODE(ppdev, pjBase, ulBltMode); CP_MM_FG_COLOR(ppdev, pjBase, lpBlt->bltFX.dwFillColor); if (ppdev->flCaps & CAPS_AUTOSTART) { CP_MM_BLT_EXT_MODE(ppdev, pjBase, ENABLE_SOLID_FILL); } else { CP_MM_SRC_ADDR(ppdev, pjBase, ppdev->ulSolidColorOffset); } CP_MM_XCNT(ppdev, pjBase, width); CP_MM_YCNT(ppdev, pjBase, height); CP_MM_DST_ADDR_ABS(ppdev, pjBase, dstOffset); CP_MM_START_BLT(ppdev, pjBase); lpBlt->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } // We specified with Our ddCaps.dwCaps that we handle a limited number of // commands, and by this point in our routine we've handled everything // except DDBLT_ROP. DirectDraw and GDI shouldn't pass us anything else; // we'll assert on debug builds to prove this. ASSERTDD((dwFlags & DDBLT_ROP) && (lpBlt->lpDDSrcSurface), "Expected dwFlags commands of only DDBLT_ASYNC and DDBLT_COLORFILL"); // Get offset, width, and height for source. srcSurf = lpBlt->lpDDSrcSurface->lpGbl; srcX = lpBlt->rSrc.left; srcY = lpBlt->rSrc.top; srcPitch = srcSurf->lPitch; srcOffset = (DWORD)(srcSurf->fpVidMem + PELS_TO_BYTES(srcX) + (srcY * srcPitch)); /* * Account for PackJR. If the start and the width are not 4 pixel * aligned, we need to BLT this by hand. Otherwsie, if they think * they are BLTing 16 bit data, we must adjust the parameters now. * * This is also a good place to check that YUV BLTs are 2 pixel * aligned. */ if (lpBlt->lpDDDestSurface->dwReserved1 & (OVERLAY_FLG_PACKJR | OVERLAY_FLG_YUV422)) { ASSERTDD(0, "Who will get here?"); #if 0 // software blt /* * Check YUV first. We can fail this if incorrect because the client * should know better (since they are explicitly use YUV). */ if ((lpBlt->lpDDDestSurface->dwReserved1 & OVERLAY_FLG_YUV422) && ((lpBlt->rSrc.left & 0x01) != (lpBlt->rDest.left & 0x01))) { lpBlt->ddRVal = DDERR_XALIGN; return (DDHAL_DRIVER_HANDLED); } /* * If PackJR is wrong, we must make this work ourselves because we * may be converting to this w/o the client knowing. */ else if (lpBlt->lpDDDestSurface->dwReserved1 & OVERLAY_FLG_PACKJR) { if (dwFlags & DDBLT_COLORFILL) { lpBlt->ddRVal = DDERR_XALIGN; return (DDHAL_DRIVER_HANDLED); } if ((lpBlt->rSrc.left & 0x03) || (lpBlt->rDest.left & 0x03)) { /* * The start doesn't align - we have to do this the slow way */ PackJRBltAlign ((LPBYTE) ppdev->pjScreen + srcOffset, (LPBYTE) ppdev->pjScreen + dstOffset, lpBlt->rDest.right - lpBlt->rDest.left, lpBlt->rDest.bottom - lpBlt->rDest.top, srcPitch, dstPitch); lpBlt->ddRVal = DD_OK; return (DDHAL_DRIVER_HANDLED); } else if (lpBlt->rSrc.right & 0x03) { /* * The end doesn't align - we will do the BLT as normal, but * write the last pixels the slow way */ if (lpBlt->lpDDDestSurface->dwReserved1 & (OVERLAY_FLG_CONVERT_PACKJR | OVERLAY_FLG_MUST_RASTER)) { srcPitch >>= 1; srcOffset = srcSurf->fpVidMem + PELS_TO_BYTES(srcX) + (srcY * srcPitch); dstPitch >>= 1; dstOffset = dstSurf->fpVidMem + PELS_TO_BYTES(dstX) + (dstY * dstPitch); } width = ((WORD)lpBlt->rSrc.right & ~0x03) - (WORD)lpBlt->rSrc.left; PackJRBltAlignEnd ((LPBYTE) ppdev->pjScreen + srcOffset + width, (LPBYTE) ppdev->pjScreen + dstOffset + width, lpBlt->rSrc.right & 0x03, lpBlt->rDest.bottom - lpBlt->rDest.top, srcPitch, dstPitch); } else if (lpBlt->lpDDDestSurface->dwReserved1 & (OVERLAY_FLG_CONVERT_PACKJR | OVERLAY_FLG_MUST_RASTER)) { /* * Everything aligns, but we have to re-calculate the start * address and the pitch. */ srcPitch >>= 1; srcOffset = srcSurf->fpVidMem + PELS_TO_BYTES(srcX) + (srcY * srcPitch); dstPitch >>= 1; dstOffset = dstSurf->fpVidMem + PELS_TO_BYTES(dstX) + (dstY * dstPitch); width >>= 1; } } #endif } if ((dstSurf == srcSurf) && (srcOffset < dstOffset)) { // Okay, we have to do the blt bottom-to-top, right-to-left. ulBltCmd = DIR_BTRL; ; srcOffset += width + (srcPitch * height); dstOffset += width + (dstPitch * height); } else { // Okay, we have to do the blt top-to-bottom, left-to-right. ulBltCmd = DIR_TBLR; } // Wait for the accelerator. while (!BLT_READY(ppdev, pjBase)) ; // // What about source color key // ASSERTDD((!(dwFlags & DDBLT_KEYSRC)), "Do not expected source color key"); if (dwFlags & DDBLT_KEYSRCOVERRIDE) { ULONG ulColor; // // sge02 // ulBltCmd |= ENABLE_TRANSPARENCY_COMPARE | ppdev->jModeColor; ulColor = lpBlt->bltFX.ddckSrcColorkey.dwColorSpaceLowValue; if (ppdev->cBpp == 1) { ulColor |= ulColor << 8; } CP_WRITE_USHORT(pjBase, MM_BLT_COLOR_KEY, ulColor); } if ( (ulBltCmd & DIR_BTRL) && (ulBltCmd & ENABLE_TRANSPARENCY_COMPARE) && (ppdev->cBpp > 1) ) { ulBltCmd &= ~DIR_BTRL; xExt = lpBlt->rDest.right - lpBlt->rDest.left; yExt = lpBlt->rDest.bottom - lpBlt->rDest.top; xDiff = dstX - srcX; yDiff = dstY - srcY; if (yDiff == 0) { srcOffset -= srcPitch * height - 1; dstOffset -= dstPitch * height - 1; while (xExt) { width = PELS_TO_BYTES(min(xDiff, xExt)); srcOffset -= width; dstOffset -= width; while (!BLT_READY(ppdev, pjBase)) ; CP_MM_ROP(ppdev, pjBase, CL_SRC_COPY); CP_MM_BLT_MODE(ppdev, pjBase, ulBltCmd); CP_MM_BLT_EXT_MODE(ppdev, pjBase, 0); CP_MM_SRC_Y_OFFSET(ppdev, pjBase, srcPitch); CP_MM_DST_Y_OFFSET(ppdev, pjBase, dstPitch); CP_MM_XCNT(ppdev, pjBase, width - 1); CP_MM_YCNT(ppdev, pjBase, height); CP_MM_SRC_ADDR(ppdev, pjBase, srcOffset); CP_MM_DST_ADDR_ABS(ppdev, pjBase, dstOffset); CP_MM_START_BLT(ppdev, pjBase); xExt -= min(xDiff, xExt); } } else { srcOffset -= width - srcPitch; dstOffset -= width - dstPitch; while (yExt) { height = min(yDiff, yExt); srcOffset -= height * srcPitch; dstOffset -= height * dstPitch; while (!BLT_READY(ppdev, pjBase)) ; CP_MM_ROP(ppdev, pjBase, CL_SRC_COPY); CP_MM_BLT_MODE(ppdev, pjBase, ulBltCmd); CP_MM_BLT_EXT_MODE(ppdev, pjBase, 0); CP_MM_SRC_Y_OFFSET(ppdev, pjBase, srcPitch); CP_MM_DST_Y_OFFSET(ppdev, pjBase, dstPitch); CP_MM_XCNT(ppdev, pjBase, width); CP_MM_YCNT(ppdev, pjBase, height - 1); CP_MM_SRC_ADDR(ppdev, pjBase, srcOffset); CP_MM_DST_ADDR_ABS(ppdev, pjBase, dstOffset); CP_MM_START_BLT(ppdev, pjBase); yExt -= min(yDiff, yExt); } } } else { CP_MM_ROP(ppdev, pjBase, CL_SRC_COPY); CP_MM_BLT_MODE(ppdev, pjBase, ulBltCmd); CP_MM_BLT_EXT_MODE(ppdev, pjBase, 0); // jl01 CP_MM_SRC_Y_OFFSET(ppdev, pjBase, srcPitch); CP_MM_DST_Y_OFFSET(ppdev, pjBase, dstPitch); CP_MM_XCNT(ppdev, pjBase, width); CP_MM_YCNT(ppdev, pjBase, height); CP_MM_SRC_ADDR(ppdev, pjBase, srcOffset); CP_MM_DST_ADDR_ABS(ppdev, pjBase, dstOffset); CP_MM_START_BLT(ppdev, pjBase); } lpBlt->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } /******************************Public*Routine******************************\ * DWORD DdFlip * \**************************************************************************/ DWORD DdFlip( PDD_FLIPDATA lpFlip) { PDEV* ppdev; BYTE* pjPorts; ULONG ulMemoryOffset; ULONG ulLowOffset; ULONG ulMiddleOffset; ULONG ulHighOffset1, ulHighOffset2; ppdev = lpFlip->lpDD->dhpdev; pjPorts = ppdev->pjPorts; DISPDBG((2, "DdFlip: %d x %d at %08x(%d, %d) Pitch=%d", lpFlip->lpSurfTarg->lpGbl->wWidth, lpFlip->lpSurfTarg->lpGbl->wHeight, lpFlip->lpSurfTarg->lpGbl->fpVidMem, lpFlip->lpSurfTarg->lpGbl->xHint, lpFlip->lpSurfTarg->lpGbl->yHint, lpFlip->lpSurfTarg->lpGbl->lPitch)); // Is the current flip still in progress? // // Don't want a flip to work until after the last flip is done, so we ask // for the general flip status and ignore the vmem. //#jc01 if ((UpdateFlipStatus(ppdev, 0) != DD_OK) || if ((UpdateFlipStatus(ppdev, 0xffffffff) != DD_OK) || /* #jc01 */ (BLT_BUSY(ppdev, ppdev->pjBase))) { lpFlip->ddRVal = DDERR_WASSTILLDRAWING; return(DDHAL_DRIVER_HANDLED); } ulMemoryOffset = (ULONG)(lpFlip->lpSurfTarg->lpGbl->fpVidMem); // Make sure that the border/blanking period isn't active; wait if it is. We // could return DDERR_WASSTILLDRAWING in this case, but that will increase // the odds that we can't flip the next time. while (CP_IN_BYTE(pjPorts, STATUS_1) & DISPLAY_MODE_INACTIVE) ; DISPDBG((2, "DdFlip Entered")); #if 1 // OVERLAY #sge if (lpFlip->lpSurfCurr->ddsCaps.dwCaps & DDSCAPS_OVERLAY) { DWORD dwOffset; BYTE bRegCR3A; BYTE bRegCR3B; BYTE bRegCR3C; // Make sure that the overlay surface we're flipping from is // currently visible. If you don't do this check, you'll get // really weird results when someone starts up two ActiveMovie // or DirectVideo movies simultaneously! if (lpFlip->lpSurfCurr->lpGbl->fpVidMem == ppdev->fpVisibleOverlay) { ppdev->fpVisibleOverlay = ulMemoryOffset; /* * Determine the offset to the new area. */ // dwOffset = ((ulMemoryOffset - (ULONG)ppdev->pjScreen) + ppdev->sOverlay1.lAdjustSource) >> 2; // sss dwOffset = ((ulMemoryOffset + ppdev->sOverlay1.lAdjustSource) >> 2); /* * Flip the overlay surface by changing CR3A, CR3B, and CR3C */ bRegCR3A = (BYTE) dwOffset & 0xfe; // Align on word boundary (5446 bug) dwOffset >>= 8; bRegCR3B = (BYTE) dwOffset; dwOffset >>= 8; bRegCR3C = (BYTE) (dwOffset & 0x0f); // if(GetOverlayFlipStatus(0) != DD_OK || DRAW_ENGINE_BUSY || IN_VBLANK) // { // lpFlipData->ddRVal = DDERR_WASSTILLDRAWING; // return DDHAL_DRIVER_HANDLED; // } CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x3C); CP_OUT_BYTE(pjPorts, CRTC_DATA, (CP_IN_BYTE(pjPorts, CRTC_DATA) & 0xf0) | bRegCR3C); CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD)bRegCR3A << 8) | 0x3A); CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD)bRegCR3B << 8) | 0x3B); } else { lpFlip->ddRVal = DDERR_OUTOFCAPS; return(DDHAL_DRIVER_HANDLED); } } else #endif // OVERLAY { // Do the flip. ulMemoryOffset >>= 2; ulLowOffset = 0x0D | ((ulMemoryOffset & 0x0000FF) << 8); ulMiddleOffset = 0x0C | ((ulMemoryOffset & 0x00FF00)); ulHighOffset1 = 0x1B | ((ulMemoryOffset & 0x010000) >> 8) | ((ulMemoryOffset & 0x060000) >> 7) | ppdev->ulCR1B; ulHighOffset2 = 0x1D | ((ulMemoryOffset & 0x080000) >> 4) | ppdev->ulCR1D; // Too bad that the Cirrus flip can't be done in a single atomic register // write; as it is, we stand a small chance of being context-switched out // and exactly hitting the vertical blank in the middle of doing these outs, // possibly causing the screen to momentarily jump. // // There are some hoops we could jump through to minimize the chances of // this happening; we could try to align the flip buffer such that the minor // registers are ensured to be identical for either flip position, ans so // that only the high address need be written, an obviously atomic // operation. // // However, I'm simply not going to worry about it. CP_OUT_WORD(pjPorts, CRTC_INDEX, ulHighOffset2); CP_OUT_WORD(pjPorts, CRTC_INDEX, ulHighOffset1); CP_OUT_WORD(pjPorts, CRTC_INDEX, ulMiddleOffset); CP_OUT_WORD(pjPorts, CRTC_INDEX, ulLowOffset); } // Remember where and when we were when we did the flip. EngQueryPerformanceCounter(&ppdev->flipRecord.liFlipTime); ppdev->flipRecord.bFlipFlag = TRUE; ppdev->flipRecord.bHaveEverCrossedVBlank = FALSE; ppdev->flipRecord.fpFlipFrom = lpFlip->lpSurfCurr->lpGbl->fpVidMem; if((CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)) { ppdev->flipRecord.dwFlipScanLine = 0; ppdev->flipRecord.bWasEverInDisplay = FALSE; } else { ppdev->flipRecord.dwFlipScanLine = GetCurrentVLine(ppdev); ppdev->flipRecord.bWasEverInDisplay = TRUE; } lpFlip->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } /******************************Public*Routine******************************\ * DWORD DdLock * \**************************************************************************/ DWORD DdLock(PDD_LOCKDATA lpLock) { PDEV* ppdev = lpLock->lpDD->dhpdev; BYTE* pjPorts = ppdev->pjPorts; // Check to see if any pending physical flip has occurred. Don't allow a // lock if a blt is in progress. if (UpdateFlipStatus(ppdev, lpLock->lpDDSurface->lpGbl->fpVidMem) != DD_OK) { lpLock->ddRVal = DDERR_WASSTILLDRAWING; return(DDHAL_DRIVER_HANDLED); } if (lpLock->dwFlags & DDLOCK_WAIT) { CP_MM_WAIT_FOR_BLT_COMPLETE(ppdev, ppdev->pjBase); } if (BLT_BUSY(ppdev, ppdev->pjBase)) { lpLock->ddRVal = DDERR_WASSTILLDRAWING; return(DDHAL_DRIVER_HANDLED); } /* * Force them to use the video apperture */ if ((lpLock->lpDDSurface->dwReserved1 & OVERLAY_FLG_OVERLAY) && (lpLock->dwFlags == DDLOCK_SURFACEMEMORYPTR) && (ppdev->fpBaseOverlay != 0xffffffff)) { if (lpLock->lpDDSurface->dwReserved1 & OVERLAY_FLG_DECIMATE) { /* * Turn on decimation */ CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x3f); CP_OUT_BYTE(pjPorts, CRTC_DATA, CP_IN_BYTE(pjPorts, CRTC_DATA) | 0x10); } if( lpLock->lpDDSurface->lpGbl->ddpfSurface.dwFourCC == FOURCC_YUY2) lpLock->lpSurfData = (LPVOID)(ppdev->fpBaseOverlay + lpLock->lpDDSurface->lpGbl->fpVidMem + 0x400000); else lpLock->lpSurfData = (LPVOID)(ppdev->fpBaseOverlay + lpLock->lpDDSurface->lpGbl->fpVidMem + 0x400000 * 3); // When a driver returns DD_OK and DDHAL_DRIVER_HANDLED from DdLock, // DirectDraw expects it to have adjusted the resulting pointer // to point to the upper left corner of the specified rectangle, if // any: if (lpLock->bHasRect) { lpLock->lpSurfData = (VOID*) ((BYTE*) lpLock->lpSurfData + lpLock->rArea.top * lpLock->lpDDSurface->lpGbl->lPitch + lpLock->rArea.left * (lpLock->lpDDSurface->lpGbl->ddpfSurface.dwYUVBitCount >> 3)); } lpLock->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } return(DDHAL_DRIVER_NOTHANDLED); } /******************************Public*Routine******************************\ * DWORD DdUnlock * \**************************************************************************/ DWORD DdUnlock(PDD_UNLOCKDATA lpUnlock) { PDEV* ppdev = lpUnlock->lpDD->dhpdev; BYTE* pjPorts = ppdev->pjPorts; if ((lpUnlock->lpDDSurface->dwReserved1 & OVERLAY_FLG_YUVPLANAR) && !(lpUnlock->lpDDSurface->dwReserved1 & OVERLAY_FLG_ENABLED)) { CP_OUT_WORD(pjPorts, CRTC_INDEX, (0x00 << 8) | 0x3f); // Turn off YUV Planar } else if (lpUnlock->lpDDSurface->dwReserved1 & OVERLAY_FLG_DECIMATE) { CP_OUT_WORD(pjPorts, CRTC_INDEX, (0x00 << 8) | 0x3f); // Turn off YUV Planar } return(DDHAL_DRIVER_NOTHANDLED); } /******************************Public*Routine******************************\ * DWORD DdGetBltStatus * * Doesn't currently really care what surface is specified, just checks * and goes. * \**************************************************************************/ DWORD DdGetBltStatus(PDD_GETBLTSTATUSDATA lpGetBltStatus) { PDEV* ppdev; HRESULT ddRVal; PBYTE pjBase; ppdev = lpGetBltStatus->lpDD->dhpdev; pjBase = ppdev->pjBase; ddRVal = DD_OK; if (lpGetBltStatus->dwFlags == DDGBS_CANBLT) { // DDGBS_CANBLT case: can we add a blt? ddRVal = UpdateFlipStatus(ppdev, lpGetBltStatus->lpDDSurface->lpGbl->fpVidMem); if (ddRVal == DD_OK) { // There was no flip going on, so can the blitter accept new // register writes? if (!BLT_READY(ppdev, pjBase)) { ddRVal = DDERR_WASSTILLDRAWING; } } } else { // DDGBS_ISBLTDONE case: is a blt in progress? if (BLT_BUSY(ppdev, pjBase)) { ddRVal = DDERR_WASSTILLDRAWING; } } lpGetBltStatus->ddRVal = ddRVal; return(DDHAL_DRIVER_HANDLED); } /******************************Public*Routine******************************\ * DWORD DdMapMemory * * This is a new DDI call specific to Windows NT that is used to map * or unmap all the application modifiable portions of the frame buffer * into the specified process's address space. * \**************************************************************************/ DWORD DdMapMemory(PDD_MAPMEMORYDATA lpMapMemory) { PDEV* ppdev; VIDEO_SHARE_MEMORY ShareMemory; VIDEO_SHARE_MEMORY_INFORMATION ShareMemoryInformation; DWORD ReturnedDataLength; ppdev = lpMapMemory->lpDD->dhpdev; if (lpMapMemory->bMap) { ShareMemory.ProcessHandle = lpMapMemory->hProcess; // 'RequestedVirtualAddress' isn't actually used for the SHARE IOCTL. ShareMemory.RequestedVirtualAddress = 0; // We map in starting at the top of the frame buffer. ShareMemory.ViewOffset = 0; // We map down to the end of the frame buffer. // // Note: There is a 64k granularity on the mapping (meaning that we // have to round up to 64k). // // Note: If there is any portion of the frame buffer that must not be // modified by an application, that portion of memory MUST NOT be // mapped in by this call. This would include any data that, if // modified by a malicious application, would cause the driver to // crash. This could include, for example, any DSP code that is // kept in off-screen memory. ShareMemory.ViewSize = ROUND_UP_TO_64K(ppdev->cyMemory * ppdev->lDelta + 0x400000 * 3); if (EngDeviceIoControl(ppdev->hDriver, IOCTL_VIDEO_SHARE_VIDEO_MEMORY, &ShareMemory, sizeof(VIDEO_SHARE_MEMORY), &ShareMemoryInformation, sizeof(VIDEO_SHARE_MEMORY_INFORMATION), &ReturnedDataLength)) { DISPDBG((0, "Failed IOCTL_VIDEO_SHARE_MEMORY")); lpMapMemory->ddRVal = DDERR_GENERIC; return(DDHAL_DRIVER_HANDLED); } lpMapMemory->fpProcess =(FLATPTR)ShareMemoryInformation.VirtualAddress; ppdev->fpBaseOverlay = lpMapMemory->fpProcess; } else { ShareMemory.ProcessHandle = lpMapMemory->hProcess; ShareMemory.ViewOffset = 0; ShareMemory.ViewSize = 0; ShareMemory.RequestedVirtualAddress = (VOID*) lpMapMemory->fpProcess; // // Active movie will unmap memory twice // //if (ppdev->fpBaseOverlay == lpMapMemory->fpProcess) // ppdev->fpBaseOverlay = 0; if (EngDeviceIoControl(ppdev->hDriver, IOCTL_VIDEO_UNSHARE_VIDEO_MEMORY, &ShareMemory, sizeof(VIDEO_SHARE_MEMORY), NULL, 0, &ReturnedDataLength)) { RIP("Failed IOCTL_VIDEO_UNSHARE_MEMORY"); } } lpMapMemory->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } /******************************Public*Routine******************************\ * DWORD DdGetFlipStatus * * If the display has gone through one refresh cycle since the flip * occurred, we return DD_OK. If it has not gone through one refresh * cycle we return DDERR_WASSTILLDRAWING to indicate that this surface * is still busy "drawing" the flipped page. We also return * DDERR_WASSTILLDRAWING if the bltter is busy and the caller wanted * to know if they could flip yet. * \**************************************************************************/ DWORD DdGetFlipStatus( PDD_GETFLIPSTATUSDATA lpGetFlipStatus) { HRESULT ddRVal; PDEV* ppdev = lpGetFlipStatus->lpDD->dhpdev; // We don't want a flip to work until after the last flip is done, so we ask // for the general flip status and ignore the vmem. //#jc01 ddRVal = UpdateFlipStatus(ppdev, 0); ddRVal = UpdateFlipStatus(ppdev, 0xffffffff); //#jc01 // Check if the blitter is busy if someone wants to know if they can flip. if ((lpGetFlipStatus->dwFlags == DDGFS_CANFLIP) && (ddRVal == DD_OK)) { if (BLT_BUSY(ppdev, ppdev->pjBase)) { ddRVal = DDERR_WASSTILLDRAWING; } } lpGetFlipStatus->ddRVal = ddRVal; return(DDHAL_DRIVER_HANDLED); } /******************************Public*Routine******************************\ * DWORD DdWaitForVerticalBlank * \**************************************************************************/ DWORD DdWaitForVerticalBlank( PDD_WAITFORVERTICALBLANKDATA lpWaitForVerticalBlank) { PDEV* ppdev; BYTE* pjPorts; ppdev = lpWaitForVerticalBlank->lpDD->dhpdev; pjPorts = ppdev->pjPorts; lpWaitForVerticalBlank->ddRVal = DD_OK; switch (lpWaitForVerticalBlank->dwFlags) { case DDWAITVB_I_TESTVB: // If TESTVB, it's just a request for the current vertical blank status. if (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE) lpWaitForVerticalBlank->bIsInVB = TRUE; else lpWaitForVerticalBlank->bIsInVB = FALSE; return(DDHAL_DRIVER_HANDLED); case DDWAITVB_BLOCKBEGIN: // If BLOCKBEGIN is requested, we wait until the vertical blank is over, // and then wait for the display period to end. while (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE) ; while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)) ; return(DDHAL_DRIVER_HANDLED); case DDWAITVB_BLOCKEND: // If BLOCKEND is requested, we wait for the vblank interval to end. while (!(CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE)) ; while (CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE) ; return(DDHAL_DRIVER_HANDLED); } return(DDHAL_DRIVER_NOTHANDLED); } /******************************Public*Routine******************************\ * DWORD DdGetScanLine * * Reads the scan line currently being scanned by the CRT. * \**************************************************************************/ DWORD DdGetScanLine( PDD_GETSCANLINEDATA lpGetScanLine) { PDEV* ppdev; BYTE* pjPorts; ppdev = (PDEV*) lpGetScanLine->lpDD->dhpdev; pjPorts = ppdev->pjPorts; /* * If a vertical blank is in progress the scan line is in * indeterminant. If the scan line is indeterminant we return * the error code DDERR_VERTICALBLANKINPROGRESS. * Otherwise we return the scan line and a success code */ if( CP_IN_BYTE(pjPorts, STATUS_1) & VBLANK_ACTIVE ) { lpGetScanLine->ddRVal = DDERR_VERTICALBLANKINPROGRESS; } else { lpGetScanLine->dwScanLine = GetCurrentVLine(ppdev); lpGetScanLine->ddRVal = DD_OK; } return(DDHAL_DRIVER_HANDLED); } /******************************Public*Routine******************************\ * DWORD DdCanCreateSurface * \**************************************************************************/ DWORD DdCanCreateSurface( PDD_CANCREATESURFACEDATA lpCanCreateSurface) { PDEV* ppdev; DWORD dwRet; LPDDSURFACEDESC lpSurfaceDesc; ppdev = (PDEV*) lpCanCreateSurface->lpDD->dhpdev; lpSurfaceDesc = lpCanCreateSurface->lpDDSurfaceDesc; dwRet = DDHAL_DRIVER_NOTHANDLED; DISPDBG((2, "DdCanCreateSurface Entered")); if (!lpCanCreateSurface->bIsDifferentPixelFormat) { // It's trivially easy to create plain surfaces that are the same // type as the primary surface: dwRet = DDHAL_DRIVER_HANDLED; } else if (ppdev->flStatus & STAT_STREAMS_ENABLED) { // When using the Streams processor, we handle only overlays of // different pixel formats -- not any off-screen memory: if (lpSurfaceDesc->ddsCaps.dwCaps & DDSCAPS_OVERLAY) { /* * YUV Planar surfaces cannot co-exist with other overlay surfaces. */ if (ppdev->OvlyCnt >= 1) { lpCanCreateSurface->ddRVal = DDERR_OUTOFCAPS; return (DDHAL_DRIVER_HANDLED); } if ((lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_YUVPLANAR) && ppdev->OvlyCnt) { lpCanCreateSurface->ddRVal = DDERR_INVALIDPIXELFORMAT; return (DDHAL_DRIVER_HANDLED); } else if (ppdev->PlanarCnt) { lpCanCreateSurface->ddRVal = DDERR_INVALIDPIXELFORMAT; return (DDHAL_DRIVER_HANDLED); } // We handle four types of YUV overlay surfaces: if (lpSurfaceDesc->ddpfPixelFormat.dwFlags & DDPF_FOURCC) { // Check first for a supported YUV type: if (lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_YUV422) { lpSurfaceDesc->ddpfPixelFormat.dwYUVBitCount = 16; dwRet = DDHAL_DRIVER_HANDLED; } else if ((lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_YUY2) && ((ppdev->ulChipID != 0x40) && (ppdev->ulChipID != 0x4C)) ) //tao1 { lpSurfaceDesc->ddpfPixelFormat.dwYUVBitCount = 16; dwRet = DDHAL_DRIVER_HANDLED; } else if (lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_PACKJR) { if( ppdev->cBitsPerPixel <= 16) { lpSurfaceDesc->ddpfPixelFormat.dwYUVBitCount = 8; dwRet = DDHAL_DRIVER_HANDLED; } } else if (lpSurfaceDesc->ddpfPixelFormat.dwFourCC == FOURCC_YUVPLANAR) { lpSurfaceDesc->ddpfPixelFormat.dwYUVBitCount = 8; dwRet = DDHAL_DRIVER_HANDLED; } } else if (lpSurfaceDesc->ddpfPixelFormat.dwFlags & DDPF_RGB) { if((lpSurfaceDesc->ddpfPixelFormat.dwFlags & DDPF_PALETTEINDEXED8) && ppdev->cBitsPerPixel == 16 ) { dwRet = DDHAL_DRIVER_HANDLED; } else if (lpSurfaceDesc->ddpfPixelFormat.dwRGBBitCount == 16) { dwRet = DDHAL_DRIVER_HANDLED; } } } } // Print some spew if this was a surface we refused to create: if (dwRet == DDHAL_DRIVER_NOTHANDLED) { if (lpSurfaceDesc->ddpfPixelFormat.dwFlags & DDPF_RGB) { DISPDBG((0, "Failed creation of %libpp RGB surface %lx %lx %lx", lpSurfaceDesc->ddpfPixelFormat.dwRGBBitCount, lpSurfaceDesc->ddpfPixelFormat.dwRBitMask, lpSurfaceDesc->ddpfPixelFormat.dwGBitMask, lpSurfaceDesc->ddpfPixelFormat.dwBBitMask)); } else { DISPDBG((0, "Failed creation of type 0x%lx YUV 0x%lx surface", lpSurfaceDesc->ddpfPixelFormat.dwFlags, lpSurfaceDesc->ddpfPixelFormat.dwFourCC)); } } lpCanCreateSurface->ddRVal = DD_OK; return(dwRet); } /******************************Public*Routine******************************\ * DWORD DdCreateSurface * \**************************************************************************/ DWORD DdCreateSurface( PDD_CREATESURFACEDATA lpCreateSurface) { PDEV* ppdev; DD_SURFACE_LOCAL* lpSurfaceLocal; DD_SURFACE_GLOBAL* lpSurfaceGlobal; LPDDSURFACEDESC lpSurfaceDesc; DWORD dwByteCount; LONG lLinearPitch; DWORD dwHeight; ppdev = (PDEV*) lpCreateSurface->lpDD->dhpdev; DISPDBG((2, "DdCreateSurface Entered")); // On Windows NT, dwSCnt will always be 1, so there will only ever // be one entry in the 'lplpSList' array: lpSurfaceLocal = lpCreateSurface->lplpSList[0]; lpSurfaceGlobal = lpSurfaceLocal->lpGbl; lpSurfaceDesc = lpCreateSurface->lpDDSurfaceDesc; // We repeat the same checks we did in 'DdCanCreateSurface' because // it's possible that an application doesn't call 'DdCanCreateSurface' // before calling 'DdCreateSurface'. ASSERTDD(lpSurfaceGlobal->ddpfSurface.dwSize == sizeof(DDPIXELFORMAT), "NT is supposed to guarantee that ddpfSurface.dwSize is valid"); // DdCanCreateSurface already validated whether the hardware supports // the surface, so we don't need to do any validation here. We'll // just go ahead and allocate it. // // Note that we don't do anything special for RGB surfaces that are // the same pixel format as the display -- by returning DDHAL_DRIVER_ // NOTHANDLED, DirectDraw will automatically handle the allocation // for us. // // Also, since we'll be making linear surfaces, make sure the width // isn't unreasonably large. // // Note that on NT, an overlay can be created only if the driver // okay's it here in this routine. Under Win95, the overlay will be // created automatically if it's the same pixel format as the primary // display. if ((lpSurfaceLocal->ddsCaps.dwCaps & DDSCAPS_OVERLAY) || (lpSurfaceGlobal->ddpfSurface.dwFlags & DDPF_FOURCC) || (lpSurfaceGlobal->ddpfSurface.dwRBitMask != ppdev->flRed)) { if (lpSurfaceGlobal->wWidth <= (DWORD) ppdev->cxMemory) { lLinearPitch = (lpSurfaceGlobal->wWidth + 7) & ~7; if (lpSurfaceGlobal->ddpfSurface.dwFlags & DDPF_FOURCC) { ASSERTDD((lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUV422) || (lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUY2) || (lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_PACKJR) || (lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUVPLANAR), "Expected our DdCanCreateSurface to allow only UYVY, YUY2, CLPJ, CLPL"); if((lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUV422) || (lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUY2)) { dwByteCount = 2; lLinearPitch <<= 1; lpSurfaceLocal->dwReserved1 |= OVERLAY_FLG_YUV422; } else if((lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_PACKJR)) { dwByteCount = 1; lpSurfaceLocal->dwReserved1 |= OVERLAY_FLG_PACKJR; } else if((lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUVPLANAR)) { dwByteCount = 1; lpSurfaceLocal->dwReserved1 |= OVERLAY_FLG_YUVPLANAR; } else { dwByteCount = 1; DISPDBG((1, "Created RGB %libpp: %li x %li Red: %lx", 8 * dwByteCount, lpSurfaceGlobal->wWidth, lpSurfaceGlobal->wHeight, lpSurfaceGlobal->ddpfSurface.dwRBitMask)); } // We have to fill in the bit-count for FourCC surfaces: lpSurfaceGlobal->ddpfSurface.dwYUVBitCount = 8 * dwByteCount; lpSurfaceGlobal->ddpfSurface.dwYBitMask = (DWORD)-1; lpSurfaceGlobal->ddpfSurface.dwUBitMask = (DWORD)-1; lpSurfaceGlobal->ddpfSurface.dwVBitMask = (DWORD)-1; DISPDBG((1, "Created YUV: %li x %li", lpSurfaceGlobal->wWidth, lpSurfaceGlobal->wHeight)); } else { dwByteCount = lpSurfaceGlobal->ddpfSurface.dwRGBBitCount >> 3; if (dwByteCount == 2) lLinearPitch <<= 1; DISPDBG((1, "Created RGB %libpp: %li x %li Red: %lx", 8 * dwByteCount, lpSurfaceGlobal->wWidth, lpSurfaceGlobal->wHeight, lpSurfaceGlobal->ddpfSurface.dwRBitMask)); } // We want to allocate a linear surface to store the FourCC // surface, but DirectDraw is using a 2-D heap-manager because // the rest of our surfaces have to be 2-D. So here we have to // convert the linear size to a 2-D size. // // The stride has to be a dword multiple: dwHeight = (lpSurfaceGlobal->wHeight * lLinearPitch + ppdev->lDelta - 1) / ppdev->lDelta; // Now fill in enough stuff to have the DirectDraw heap-manager // do the allocation for us: lpSurfaceGlobal->fpVidMem = DDHAL_PLEASEALLOC_BLOCKSIZE; lpSurfaceGlobal->dwBlockSizeX = ppdev->lDelta; // Specified in bytes lpSurfaceGlobal->dwBlockSizeY = dwHeight; lpSurfaceGlobal->lPitch = lLinearPitch; lpSurfaceDesc->lPitch = lLinearPitch; lpSurfaceDesc->dwFlags |= DDSD_PITCH; lpSurfaceLocal->dwReserved1 |= OVERLAY_FLG_OVERLAY; if (lpSurfaceGlobal->ddpfSurface.dwFourCC == FOURCC_YUVPLANAR) { ppdev->PlanarCnt++; } else { ppdev->OvlyCnt++; } ppdev->fpBaseOverlay = 0xffffffff; } else { DISPDBG((1, "Refused to create surface with large width")); } } return(DDHAL_DRIVER_NOTHANDLED); } /******************************Public*Routine******************************\ * DWORD DdDestroySurface * \**************************************************************************/ DWORD DdDestroySurface (PDD_DESTROYSURFACEDATA lpDestroySurface) { PDEV* ppdev; BYTE* pjPorts; ppdev = (PDEV*) lpDestroySurface->lpDD->dhpdev; pjPorts = ppdev->pjPorts; DISPDBG((2, "In DestroyOverlaySurface")); if (lpDestroySurface->lpDDSurface->dwReserved1 & OVERLAY_FLG_ENABLED) { BYTE bTemp; /* * Turn the video off */ DISPDBG((1,"Turning off video in DestroySurface")); ppdev->pfnDisableOverlay(ppdev); ppdev->pfnClearAltFIFOThreshold(ppdev); if (lpDestroySurface->lpDDSurface->dwReserved1 & OVERLAY_FLG_COLOR_KEY) { CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a); bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Clear CR1A[3:2] CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x0C); } /* * Turn off YUV Planar */ if (lpDestroySurface->lpDDSurface->dwReserved1 & OVERLAY_FLG_YUVPLANAR) { CP_OUT_WORD(pjPorts, CRTC_INDEX, (0x00 << 8) | 0x3f); // Turn off YUV Planar } ppdev->fpVisibleOverlay = (FLATPTR)NULL; ppdev->dwPanningFlag &= ~OVERLAY_OLAY_SHOW; } if (lpDestroySurface->lpDDSurface->dwReserved1 & OVERLAY_FLG_YUVPLANAR) { if (ppdev->PlanarCnt > 0) ppdev->PlanarCnt--; } else { if (ppdev->OvlyCnt > 0) ppdev->OvlyCnt--; } if (lpDestroySurface->lpDDSurface->ddsCaps.dwCaps & DDSCAPS_LIVEVIDEO) { BYTE bTemp; CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x51); bTemp= CP_IN_BYTE(pjPorts, CRTC_DATA); CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x08); } return(DDHAL_DRIVER_NOTHANDLED); } /******************************Public*Routine******************************\ * DWORD DdSetColorKey * \**************************************************************************/ DWORD DdSetColorKey( PDD_SETCOLORKEYDATA lpSetColorKey) { PDEV* ppdev; BYTE* pjPorts; BYTE* pjBase; DD_SURFACE_GLOBAL* lpSurface; DWORD dwKeyLow; DWORD dwKeyHigh; ppdev = (PDEV*) lpSetColorKey->lpDD->dhpdev; DISPDBG((2, "DdSetColorKey Entered")); ASSERTDD(ppdev->flStatus & STAT_STREAMS_ENABLED, "Shouldn't have hooked call"); pjPorts = ppdev->pjPorts; pjBase = ppdev->pjBase; lpSurface = lpSetColorKey->lpDDSurface->lpGbl; // We don't have to do anything for normal blt source colour keys: if (lpSetColorKey->dwFlags & DDCKEY_SRCBLT) { lpSetColorKey->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } else if ((lpSetColorKey->dwFlags & DDCKEY_DESTOVERLAY) && (lpSetColorKey->lpDDSurface == ppdev->lpColorSurface)) { if (lpSurface->fpVidMem == ppdev->fpVisibleOverlay) { ppdev->wColorKey = (WORD) lpSetColorKey->ckNew.dwColorSpaceLowValue; ppdev->pfnRegInitVideo(ppdev, lpSetColorKey->lpDDSurface); } lpSetColorKey->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } else if ((lpSetColorKey->dwFlags & DDCKEY_SRCOVERLAY) && (lpSetColorKey->lpDDSurface == ppdev->lpSrcColorSurface)) { if (lpSurface->fpVidMem == ppdev->fpVisibleOverlay) { ppdev->dwSrcColorKeyLow = lpSetColorKey->ckNew.dwColorSpaceLowValue; ppdev->dwSrcColorKeyHigh = lpSetColorKey->ckNew.dwColorSpaceHighValue; if (ppdev->dwSrcColorKeyLow > ppdev->dwSrcColorKeyHigh) { ppdev->dwSrcColorKeyHigh = ppdev->dwSrcColorKeyLow; } ppdev->pfnRegInitVideo(ppdev, lpSetColorKey->lpDDSurface); } lpSetColorKey->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } DISPDBG((1, "DdSetColorKey: Invalid command")); return(DDHAL_DRIVER_NOTHANDLED); } /******************************Public*Routine******************************\ * DWORD DdUpdateOverlay * \**************************************************************************/ DWORD DdUpdateOverlay( PDD_UPDATEOVERLAYDATA lpUpdateOverlay) { PDEV* ppdev; BYTE* pjPorts; BYTE* pjBase; DD_SURFACE_GLOBAL* lpSource; DD_SURFACE_GLOBAL* lpDestination; DWORD dwStride; LONG srcWidth; LONG srcHeight; LONG dstWidth; LONG dstHeight; DWORD dwBitCount; DWORD dwStart; DWORD dwTmp; BOOL bColorKey; DWORD dwKeyLow; DWORD dwKeyHigh; DWORD dwBytesPerPixel; DWORD dwSecCtrl; DWORD dwBlendCtrl; DWORD dwFourcc; BOOL bCheckBandwidth; WORD wBitCount; DWORD_PTR dwOldStatus; BYTE bTemp; ppdev = (PDEV*) lpUpdateOverlay->lpDD->dhpdev; DISPDBG((2, "DdUpdateOverlay Entered")); ASSERTDD(ppdev->flStatus & STAT_STREAMS_ENABLED, "Shouldn't have hooked call"); pjPorts = ppdev->pjPorts; pjBase = ppdev->pjBase; //myf33 begin // Initialize the bandwidth registers Regs.bSR2F = 0; Regs.bSR32 = 0; Regs.bSR34 = 0; Regs.bCR42 = 0; //myf33 end if (lpUpdateOverlay->lpDDSrcSurface->dwFlags & DDRAWISURF_HASPIXELFORMAT) { GetFormatInfo(ppdev, &(lpUpdateOverlay->lpDDSrcSurface->lpGbl->ddpfSurface), &dwFourcc, &wBitCount); } else { // This needs to be changed when primary surface is RGB 5:6:5 dwFourcc = BI_RGB; wBitCount = (WORD) ppdev->cBitsPerPixel; } /* * Are we color keying? */ bCheckBandwidth = TRUE; ppdev->lpColorSurface = ppdev->lpSrcColorSurface = NULL; dwOldStatus = lpUpdateOverlay->lpDDSrcSurface->dwReserved1; if ((lpUpdateOverlay->dwFlags & (DDOVER_KEYDEST | DDOVER_KEYDESTOVERRIDE)) && (lpUpdateOverlay->dwFlags & (DDOVER_KEYSRC | DDOVER_KEYSRCOVERRIDE))) { /* * Cannot perform src colorkey and dest colorkey at the same time */ lpUpdateOverlay->ddRVal = DDERR_NOCOLORKEYHW; return (DDHAL_DRIVER_HANDLED); } lpUpdateOverlay->lpDDSrcSurface->dwReserved1 &= ~(OVERLAY_FLG_COLOR_KEY|OVERLAY_FLG_SRC_COLOR_KEY); if (lpUpdateOverlay->dwFlags & (DDOVER_KEYDEST | DDOVER_KEYDESTOVERRIDE)) { if (ppdev->pfnIsSufficientBandwidth(ppdev, wBitCount, &(lpUpdateOverlay->rSrc), &(lpUpdateOverlay->rDest), OVERLAY_FLG_COLOR_KEY)) { bCheckBandwidth = FALSE; lpUpdateOverlay->lpDDSrcSurface->dwReserved1 |= OVERLAY_FLG_COLOR_KEY; if (lpUpdateOverlay->dwFlags & DDOVER_KEYDEST) { ppdev->wColorKey = (WORD) lpUpdateOverlay->lpDDDestSurface->ddckCKDestOverlay.dwColorSpaceLowValue; ppdev->lpColorSurface = lpUpdateOverlay->lpDDDestSurface; } else { ppdev->wColorKey = (WORD) lpUpdateOverlay->overlayFX.dckDestColorkey.dwColorSpaceLowValue; } } else { lpUpdateOverlay->ddRVal = DDERR_NOCOLORKEYHW; return (DDHAL_DRIVER_HANDLED); } } else if (lpUpdateOverlay->dwFlags & (DDOVER_KEYSRC | DDOVER_KEYSRCOVERRIDE)) { if (ppdev->pfnIsSufficientBandwidth(ppdev, wBitCount, &(lpUpdateOverlay->rSrc), &(lpUpdateOverlay->rDest), OVERLAY_FLG_SRC_COLOR_KEY)) { bCheckBandwidth = FALSE; lpUpdateOverlay->lpDDSrcSurface->dwReserved1 |= OVERLAY_FLG_SRC_COLOR_KEY; ppdev->lpSrcColorSurface = lpUpdateOverlay->lpDDSrcSurface; if (lpUpdateOverlay->dwFlags & DDOVER_KEYSRC) { ppdev->dwSrcColorKeyLow = lpUpdateOverlay->lpDDSrcSurface->ddckCKSrcOverlay.dwColorSpaceLowValue; ppdev->dwSrcColorKeyHigh = lpUpdateOverlay->lpDDSrcSurface->ddckCKSrcOverlay.dwColorSpaceHighValue; } else { ppdev->dwSrcColorKeyLow = lpUpdateOverlay->overlayFX.dckSrcColorkey.dwColorSpaceLowValue; ppdev->dwSrcColorKeyHigh = lpUpdateOverlay->overlayFX.dckSrcColorkey.dwColorSpaceHighValue; } if (ppdev->dwSrcColorKeyHigh < ppdev->dwSrcColorKeyHigh) { ppdev->dwSrcColorKeyHigh = ppdev->dwSrcColorKeyLow; } } else { DISPDBG((0, "Insufficient bandwidth for colorkeying")); lpUpdateOverlay->ddRVal = DDERR_NOCOLORKEYHW; return (DDHAL_DRIVER_HANDLED); } } // 'Source' is the overlay surface, 'destination' is the surface to // be overlayed: lpSource = lpUpdateOverlay->lpDDSrcSurface->lpGbl; if (lpUpdateOverlay->dwFlags & DDOVER_HIDE) { if (lpSource->fpVidMem == ppdev->fpVisibleOverlay) { /* * Turn the video off */ ppdev->pfnDisableOverlay(ppdev); ppdev->pfnClearAltFIFOThreshold(ppdev); /* * If we are color keying, we will disable that now */ if (dwOldStatus & OVERLAY_FLG_COLOR_KEY) { CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a); bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Clear CR1A[3:2] CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x0C); } ppdev->dwPanningFlag &= ~OVERLAY_OLAY_SHOW; lpUpdateOverlay->lpDDSrcSurface->dwReserved1 &= ~OVERLAY_FLG_ENABLED; ppdev->fpVisibleOverlay = 0; } lpUpdateOverlay->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } // Dereference 'lpDDDestSurface' only after checking for the DDOVER_HIDE // case: #if 0 /* * Turn the video off first to protect side effect when moving. * Later RegIniVideo will turn it on if needed. */ CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x3e); bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x01); // Clear CR3E[0] #endif lpDestination = lpUpdateOverlay->lpDDDestSurface->lpGbl; if (lpSource->fpVidMem != ppdev->fpVisibleOverlay) { if (lpUpdateOverlay->dwFlags & DDOVER_SHOW) { if (ppdev->fpVisibleOverlay != 0) { // Some other overlay is already visible: DISPDBG((0, "DdUpdateOverlay: An overlay is already visible")); lpUpdateOverlay->ddRVal = DDERR_OUTOFCAPS; return(DDHAL_DRIVER_HANDLED); } else { // We're going to make the overlay visible, so mark it as // such: ppdev->fpVisibleOverlay = lpSource->fpVidMem; } } else { // The overlay isn't visible, and we haven't been asked to make // it visible, so this call is trivially easy: lpUpdateOverlay->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } } /* * Is there sufficient bandwidth to work? */ if (bCheckBandwidth && !ppdev->pfnIsSufficientBandwidth(ppdev, wBitCount, &(lpUpdateOverlay->rSrc), &(lpUpdateOverlay->rDest), 0)) { lpUpdateOverlay->ddRVal = DDERR_OUTOFCAPS; return (DDHAL_DRIVER_HANDLED); } /* * Save the rectangles */ ppdev->rOverlaySrc = lpUpdateOverlay->rSrc; ppdev->rOverlayDest = lpUpdateOverlay->rDest; if (lpUpdateOverlay->lpDDSrcSurface->dwReserved1 & OVERLAY_FLG_DECIMATE) { ppdev->rOverlaySrc.right = ppdev->rOverlaySrc.left + ((ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left) >> 1); } if (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left <= MIN_OLAY_WIDTH) { lpUpdateOverlay->ddRVal = DDERR_OUTOFCAPS; return (DDHAL_DRIVER_HANDLED); } lpUpdateOverlay->lpDDSrcSurface->dwReserved1 |= OVERLAY_FLG_ENABLED; // // Assign 5c to 1F when video is on while no color key for 5446BE. // // sge04 //if (bCheckBandwidth && ppdev->flCaps & CAPS_SECOND_APERTURE) if (ppdev->flCaps & CAPS_SECOND_APERTURE) ppdev->lFifoThresh = 0x0E; ppdev->pfnRegInitVideo(ppdev, lpUpdateOverlay->lpDDSrcSurface); lpUpdateOverlay->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } /******************************Public*Routine******************************\ * DWORD DdSetOverlayPosition * \**************************************************************************/ DWORD DdSetOverlayPosition( PDD_SETOVERLAYPOSITIONDATA lpSetOverlayPosition) { PDEV* ppdev; BYTE* pjPorts; BYTE* pjBase; ppdev = (PDEV*) lpSetOverlayPosition->lpDD->dhpdev; pjPorts = ppdev->pjPorts; pjBase = ppdev->pjBase; DISPDBG((2, "DdSetOverlayPosition Entered")); ASSERTDD(ppdev->flStatus & STAT_STREAMS_ENABLED, "Shouldn't have hooked call"); if(lpSetOverlayPosition->lpDDSrcSurface->lpGbl->fpVidMem == ppdev->fpVisibleOverlay) { /* * Update the rectangles */ ppdev->rOverlayDest.right = (ppdev->rOverlayDest.right - ppdev->rOverlayDest.left) + lpSetOverlayPosition->lXPos; ppdev->rOverlayDest.left = lpSetOverlayPosition->lXPos; ppdev->rOverlayDest.bottom = (ppdev->rOverlayDest.bottom - ppdev->rOverlayDest.top) + lpSetOverlayPosition->lYPos; ppdev->rOverlayDest.top = lpSetOverlayPosition->lYPos; //myf29 RegMoveVideo(ppdev, lpSetOverlayPosition->lpDDSrcSurface); ppdev->pfnRegMoveVideo(ppdev, lpSetOverlayPosition->lpDDSrcSurface); } lpSetOverlayPosition->ddRVal = DD_OK; return(DDHAL_DRIVER_HANDLED); } /******************************************************************************\ * * Function: DrvGetDirectDrawInfo * * This function returns te capabilities of the DirectDraw implementation. It is * called twice during the connect phase. * * Parameters: dhpdev Handle to physical device. * pHalInfo Pointer to a DD_HALINFO structure. * pdwNumHeaps Pointer to a variable that holds the number of * heaps. * pvmList Pointer to the heap array. * pdwNumFourCC Pointer to a variable that holds the number of * FourCC IDs. * pdwFourCC Pointer to FourCC IDs. * * Returns: TRUE if successful. * \******************************************************************************/ BOOL DrvGetDirectDrawInfo( DHPDEV dhpdev, DD_HALINFO* pHalInfo, DWORD* pdwNumHeaps, VIDEOMEMORY* pvmList, DWORD* pdwNumFourCC, DWORD* pdwFourCC) { BOOL bCanFlip; PDEV* ppdev = (PPDEV) dhpdev; LONGLONG li; OH* poh; RECTL rSrc, rDest; LONG lZoom; BYTE* pjPorts = ppdev->pjPorts; BYTE bTemp; // We may not support DirectDraw on this card. if (!(ppdev->flStatus & STAT_DIRECTDRAW)) { return(FALSE); } DISPDBG((2, "DrvGetDirectDrawInfo Entered")); pHalInfo->dwSize = sizeof(DD_HALINFO); // Current primary surface attributes. Since HalInfo is zero-initialized by // GDI, we only have to fill in the fields which should be non-zero. pHalInfo->vmiData.pvPrimary = ppdev->pjScreen; pHalInfo->vmiData.dwDisplayWidth = ppdev->cxScreen; pHalInfo->vmiData.dwDisplayHeight = ppdev->cyScreen; pHalInfo->vmiData.lDisplayPitch = ppdev->lDelta; pHalInfo->vmiData.dwOffscreenAlign = 4; pHalInfo->vmiData.ddpfDisplay.dwSize = sizeof(DDPIXELFORMAT); pHalInfo->vmiData.ddpfDisplay.dwFlags = DDPF_RGB; pHalInfo->vmiData.ddpfDisplay.dwRGBBitCount = ppdev->cBitsPerPixel; if (ppdev->cBpp == 1) { pHalInfo->vmiData.ddpfDisplay.dwFlags |= DDPF_PALETTEINDEXED8; } // These masks will be zero at 8bpp. pHalInfo->vmiData.ddpfDisplay.dwRBitMask = ppdev->flRed; pHalInfo->vmiData.ddpfDisplay.dwGBitMask = ppdev->flGreen; pHalInfo->vmiData.ddpfDisplay.dwBBitMask = ppdev->flBlue; if (ppdev->cBpp == 4) { pHalInfo->vmiData.ddpfDisplay.dwRGBAlphaBitMask = ~(ppdev->flRed | ppdev->flGreen | ppdev->flBlue); } // Set up the pointer to the first available video memory after the primary // surface. bCanFlip = FALSE; *pdwNumHeaps = 0; // Free up as much off-screen memory as possible. bMoveAllDfbsFromOffscreenToDibs(ppdev); // Move all DFBs to DIB.s vAssertModeText(ppdev, FALSE); // Destroy all cached fonts. if ((ppdev->ulChipID == CL7555_ID) || (ppdev->ulChipID == CL7556_ID))//myf32 { MIN_OLAY_WIDTH = 16; #if (_WIN32_WINNT >= 0x0400) ppdev->flCaps |= CAPS_VIDEO; #endif ppdev->pfnIsSufficientBandwidth=Is7555SufficientBandwidth; ppdev->pfnRegInitVideo=RegInit7555Video; ppdev->pfnRegMoveVideo=RegMove7555Video; ppdev->pfnDisableOverlay=DisableVideoWindow; ppdev->pfnClearAltFIFOThreshold=ClearAltFIFOThreshold; } else { ppdev->pfnIsSufficientBandwidth = (ppdev->ulChipID != 0xBC) ? IsSufficientBandwidth : Is5480SufficientBandwidth ; // chu03 ppdev->pfnRegInitVideo=RegInitVideo; ppdev->pfnRegMoveVideo=RegMoveVideo; ppdev->pfnDisableOverlay=DisableOverlay_544x; ppdev->pfnClearAltFIFOThreshold=ClearAltFIFOThreshold_544x; } // Now simply reserve the biggest chunk for use by DirectDraw. poh = ppdev->pohDirectDraw; #if (DIRECTX_24 < 2) if ((poh == NULL) && (ppdev->cBpp != 3)) #else if (poh == NULL) #endif { LONG cxMax, cyMax; cxMax = ppdev->heap.cxMax & ~(HEAP_X_ALIGNMENT - 1); cyMax = ppdev->heap.cyMax; poh = pohAllocatePermanent(ppdev, cxMax, cyMax); if (poh == NULL) { // Could not allocate all memory, find the biggest area now. cxMax = cyMax = 0; for (poh = ppdev->heap.ohAvailable.pohNext; poh != &ppdev->heap.ohAvailable; poh = poh->pohNext) { if ((poh->cx * poh->cy) > (cxMax * cyMax)) { cxMax = poh->cx & ~(HEAP_X_ALIGNMENT - 1); cyMax = poh->cy; } } poh = pohAllocatePermanent(ppdev, cxMax, cyMax); } ppdev->pohDirectDraw = poh; } if (poh != NULL) { *pdwNumHeaps = 1; // Fill in the list of off-screen rectangles if we've been asked to do // so. if (pvmList != NULL) { DISPDBG((1, "DirectDraw gets %d x %d surface at (%d, %d)", poh->cx, poh->cy, poh->x, poh->y)); #if 0 if (PELS_TO_BYTES(poh->cx) != ppdev->lDelta) { #endif pvmList->dwFlags = VIDMEM_ISRECTANGULAR; pvmList->fpStart = poh->xy; pvmList->dwWidth = PELS_TO_BYTES(poh->cx); pvmList->dwHeight = poh->cy; #if 0 } else { pvmList->dwFlags = VIDMEM_ISLINEAR; pvmList->fpStart = poh->xy; pvmList->fpEnd = poh->xy - 1 + PELS_TO_BYTES(poh->cx) + poh->cy * ppdev->lDelta; } #endif pvmList->ddsCaps.dwCaps = DDSCAPS_OFFSCREENPLAIN; if ((poh->cx >= ppdev->cxScreen) && (poh->cy >= ppdev->cyScreen)) { bCanFlip = TRUE; } } } // Capabilities supported. pHalInfo->ddCaps.dwFXCaps = 0; pHalInfo->ddCaps.dwCaps = DDCAPS_BLT | DDCAPS_BLTCOLORFILL | DDCAPS_READSCANLINE; // sge08 add this bit pHalInfo->ddCaps.dwCaps2 = DDCAPS2_COPYFOURCC; if ( (ppdev->flCaps & CAPS_VIDEO) && (ppdev->cBpp <= 2) ) { pHalInfo->ddCaps.dwCaps |= DDCAPS_COLORKEY; pHalInfo->ddCaps.dwCKeyCaps = DDCKEYCAPS_SRCBLT; } pHalInfo->ddCaps.ddsCaps.dwCaps = DDSCAPS_OFFSCREENPLAIN | DDSCAPS_PRIMARYSURFACE; if (bCanFlip) { pHalInfo->ddCaps.ddsCaps.dwCaps |= DDSCAPS_FLIP; } // FourCCs supported. *pdwNumFourCC = 0; #if 0 // smac - disable overlays due to too many bugs { // // Interlaced mode ? // BOOL Interlaced ; // chu02 CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a) ; Interlaced = CP_IN_BYTE(pjPorts, CRTC_DATA) & 0x01 ; // // Needs check more later // if ((ppdev->flCaps & CAPS_VIDEO) && (!Interlaced)) // chu02 ppdev->flStatus |= STAT_STREAMS_ENABLED; if (ppdev->flStatus & STAT_STREAMS_ENABLED) { /* * Are we double clocked? */ ppdev->bDoubleClock = FALSE; // // use SR7 to check the double clock instead of hidden register // // CP_OUT_BYTE(pjPorts, SR_INDEX, 0x7); bTemp = CP_IN_BYTE(pjPorts, SR_DATA); if ((((bTemp & 0x0E) == 0x06) && ppdev->cBitsPerPixel == 8) || (((bTemp & 0x0E) == 0x08) && ppdev->cBitsPerPixel == 16)) { ppdev->bDoubleClock = TRUE; } pHalInfo->vmiData.dwOverlayAlign = 8; pHalInfo->ddCaps.dwCaps |= DDCAPS_OVERLAY | DDCAPS_OVERLAYSTRETCH | DDCAPS_OVERLAYFOURCC | DDCAPS_OVERLAYCANTCLIP | DDCAPS_ALIGNSTRIDE; pHalInfo->ddCaps.dwFXCaps |= DDFXCAPS_OVERLAYSTRETCHX | DDFXCAPS_OVERLAYSTRETCHY | DDFXCAPS_OVERLAYARITHSTRETCHY; pHalInfo->ddCaps.dwCKeyCaps |= DDCKEYCAPS_DESTOVERLAY | DDCKEYCAPS_DESTOVERLAYYUV | DDCKEYCAPS_DESTOVERLAYONEACTIVE; pHalInfo->ddCaps.dwCKeyCaps |= DDCKEYCAPS_SRCOVERLAY | DDCKEYCAPS_SRCOVERLAYCLRSPACE | DDCKEYCAPS_SRCOVERLAYCLRSPACEYUV | DDCKEYCAPS_SRCOVERLAYONEACTIVE | DDCKEYCAPS_SRCOVERLAYYUV; pHalInfo->ddCaps.ddsCaps.dwCaps |= DDSCAPS_OVERLAY; *pdwNumFourCC = 3; if ((ppdev->ulChipID == 0x40) || (ppdev->ulChipID == 0x4C)) //tao1 *pdwNumFourCC = 2; //tao1 if (pdwFourCC) { pdwFourCC[0] = FOURCC_YUV422; pdwFourCC[1] = FOURCC_PACKJR; if ((ppdev->ulChipID != 0x40) && (ppdev->ulChipID != 0x4C)) //tao1 pdwFourCC[2] = FOURCC_YUY2; //tao1 } pHalInfo->ddCaps.dwMaxVisibleOverlays = 1; pHalInfo->ddCaps.dwCurrVisibleOverlays = 0; pHalInfo->ddCaps.dwNumFourCCCodes = 2; # if 1 pHalInfo->ddCaps.dwAlignBoundarySrc = 1; pHalInfo->ddCaps.dwAlignSizeSrc = 1; // chu01 sge05 #if 1 if ((ppdev->cBpp == 3) || ppdev->bDoubleClock ) { pHalInfo->ddCaps.dwAlignBoundaryDest = 4; pHalInfo->ddCaps.dwAlignSizeDest = 4; } else { pHalInfo->ddCaps.dwAlignBoundaryDest = 1; pHalInfo->ddCaps.dwAlignSizeDest = 1; } #else pHalInfo->ddCaps.dwAlignBoundaryDest = 1; pHalInfo->ddCaps.dwAlignSizeDest = 1; #endif // 1 pHalInfo->ddCaps.dwAlignStrideAlign = 8; pHalInfo->ddCaps.dwMinOverlayStretch = 8000; pHalInfo->ddCaps.dwMinLiveVideoStretch = 8000; pHalInfo->ddCaps.dwMinHwCodecStretch = 8000; pHalInfo->ddCaps.dwMaxOverlayStretch = 8000; pHalInfo->ddCaps.dwMaxLiveVideoStretch = 8000; pHalInfo->ddCaps.dwMaxHwCodecStretch = 8000; // // maybe there are special requirement for VCLK > 85Hz // #endif rSrc.left = rSrc.top = 0; rSrc.right = 320; rSrc.bottom = 240; rDest.left = rDest.top = 0; rDest.right = 1280; rDest.bottom = 960; lZoom = 1000; do { rDest.right = (320 * lZoom)/ 1000; rDest.bottom = (240 * lZoom)/1000; if (ppdev->pfnIsSufficientBandwidth(ppdev, 16, (LPRECTL) &rSrc, (LPRECTL) &rDest, 0)) { DISPDBG((1, "Minimum zoom factor: %d", lZoom)); pHalInfo->ddCaps.dwMinOverlayStretch = lZoom; pHalInfo->ddCaps.dwMinLiveVideoStretch = lZoom; pHalInfo->ddCaps.dwMinHwCodecStretch = lZoom; lZoom = 4000; } lZoom += 100; } while (lZoom < 4000); } } #endif // smac return(TRUE); } /******************************************************************************\ * * Function: DrvEnableDirectDraw * * Enable DirectDraw. This function is called when an application opens a * DirectDraw connection. * * Parameters: dhpdev Handle to physical device. * pCallBacks Pointer to DirectDraw callbacks. * pSurfaceCallBacks Pointer to surface callbacks. * pPaletteCallBacks Pointer to palette callbacks. * * Returns: TRUE if successful. * \******************************************************************************/ BOOL DrvEnableDirectDraw( DHPDEV dhpdev, DD_CALLBACKS* pCallBacks, DD_SURFACECALLBACKS* pSurfaceCallBacks, DD_PALETTECALLBACKS* pPaletteCallBacks) { PDEV* ppdev = (PPDEV) dhpdev; pCallBacks->WaitForVerticalBlank = DdWaitForVerticalBlank; pCallBacks->MapMemory = DdMapMemory; pCallBacks->GetScanLine = DdGetScanLine; pCallBacks->dwFlags = DDHAL_CB32_WAITFORVERTICALBLANK | DDHAL_CB32_MAPMEMORY | DDHAL_CB32_GETSCANLINE; pSurfaceCallBacks->Blt = DdBlt; pSurfaceCallBacks->Flip = DdFlip; pSurfaceCallBacks->Lock = DdLock; pSurfaceCallBacks->GetBltStatus = DdGetBltStatus; pSurfaceCallBacks->GetFlipStatus = DdGetFlipStatus; pSurfaceCallBacks->dwFlags = DDHAL_SURFCB32_BLT | DDHAL_SURFCB32_FLIP | DDHAL_SURFCB32_LOCK | DDHAL_SURFCB32_GETBLTSTATUS | DDHAL_SURFCB32_GETFLIPSTATUS; if (ppdev->flStatus & STAT_STREAMS_ENABLED) { pCallBacks->CreateSurface = DdCreateSurface; pCallBacks->CanCreateSurface = DdCanCreateSurface; pCallBacks->dwFlags |= DDHAL_CB32_CREATESURFACE | DDHAL_CB32_CANCREATESURFACE; pSurfaceCallBacks->SetColorKey = DdSetColorKey; pSurfaceCallBacks->UpdateOverlay = DdUpdateOverlay; pSurfaceCallBacks->SetOverlayPosition = DdSetOverlayPosition; pSurfaceCallBacks->DestroySurface = DdDestroySurface; pSurfaceCallBacks->dwFlags |= DDHAL_SURFCB32_SETCOLORKEY | DDHAL_SURFCB32_UPDATEOVERLAY | DDHAL_SURFCB32_SETOVERLAYPOSITION | DDHAL_SURFCB32_DESTROYSURFACE; // The DrvEnableDirectDraw call can occur while we're in full- // screen DOS mode. Do not turn on the streams processor now // if that's the case, instead wait until AssertMode switches // us back to graphics mode: } // Note that we don't call 'vGetDisplayDuration' here, for a couple of // reasons: // // o Because the system is already running, it would be disconcerting // to pause the graphics for a good portion of a second just to read // the refresh rate; // o More importantly, we may not be in graphics mode right now. // // For both reasons, we always measure the refresh rate when we switch // to a new mode. return(TRUE); } /******************************************************************************\ * * Function: DrvDisableDirectDraw * * Disable DirectDraw. This function is called when an application closes the * DirectDraw connection. * * Parameters: dhpdev Handle to physical device. * * Returns: Nothing. * \******************************************************************************/ VOID DrvDisableDirectDraw( DHPDEV dhpdev) { PDEV* ppdev; OH* poh; // DirectDraw is done with the display, so we can go back to using // all of off-screen memory ourselves. ppdev = (PPDEV) dhpdev; poh = ppdev->pohDirectDraw; if (poh) { DISPDBG((1, "Releasing DirectDraw surface %d x %d at (%d, %d)", poh->cx, poh->cy, poh->x, poh->y)); } pohFree(ppdev, poh); ppdev->pohDirectDraw = NULL; // Invalidate all cached fonts. vAssertModeText(ppdev, TRUE); } /******************************************************************************\ * * Function: vAssertModeDirectDraw * * Perform specific DirectDraw initialization when the screen switches focus * (from graphics to full screen MS-DOS and vice versa). * * Parameters: ppdev Pointer to physical device. * bEnabled True if the screen is in graphics mode. * * Returns: Nothing. * \******************************************************************************/ VOID vAssertModeDirectDraw( PDEV* ppdev, BOOL bEnabled) { } /******************************************************************************\ * * Function: bEnableDirectDraw * * Enable DirectDraw. Called from DrvEnableSurface. * * Parameters: ppdev Pointer to phsyical device. * * Returns: Nothing. * \******************************************************************************/ BOOL bEnableDirectDraw( PDEV* ppdev) { if (DIRECT_ACCESS(ppdev) && // Direct access must be enabled. #if (DIRECTX_24 < 1) (ppdev->cBpp != 3) && // Turn off DirectDraw in 24-bpp. #endif (ppdev->flCaps & CAPS_ENGINEMANAGED) && // Only support CL-GD5436/5446. (ppdev->flCaps & CAPS_MM_IO)) // Memory Mapped I/O must be on. { // We have to preserve the contents of the CR1B and CR1D registers on a // page flip. CP_OUT_BYTE(ppdev->pjPorts, CRTC_INDEX, 0x1B); ppdev->ulCR1B = (CP_IN_BYTE(ppdev->pjPorts, CRTC_DATA) & 0xF2) << 8; CP_OUT_BYTE(ppdev->pjPorts, CRTC_INDEX, 0x1D); ppdev->ulCR1D = (CP_IN_BYTE(ppdev->pjPorts, CRTC_DATA) & 0x7F) << 8; // Accurately measure the refresh rate for later. vGetDisplayDuration(ppdev); // DirectDraw is all set to be used on this card. ppdev->flStatus |= STAT_DIRECTDRAW; #if 1 // sge EnableStartAddrDoubleBuffer(ppdev); #endif // sge } return(TRUE); } /******************************************************************************\ * * Function: vDisableDirectDraw * * Disbale DirectDraw. Called from DrvDisableSurface. * * Parameters: ppdev Pointer to physical device. * * Returns: Nothing. * \******************************************************************************/ VOID vDisableDirectDraw( PDEV* ppdev) { } #if 1 // OVERLAY #sge /******************************************************************************\ * * Function: GetFormatInfo * * Get DirectDraw information, * * Parameters: ppdev Pointer to physical device. * * Returns: Nothing. * \******************************************************************************/ VOID GetFormatInfo(PDEV* ppdev, LPDDPIXELFORMAT lpFormat, LPDWORD lpFourcc, LPWORD lpBitCount) { if (lpFormat->dwFlags & DDPF_FOURCC) { *lpFourcc = lpFormat->dwFourCC; if (lpFormat->dwFourCC == BI_RGB) { *lpBitCount = (WORD) lpFormat->dwRGBBitCount; #ifdef DEBUG if (lpFormat->dwRGBBitCount == 8) { DISPDBG((1, "Format: RGB 8")); } else if (lpFormat->dwRGBBitCount == 16) { DISPDBG ((1,"Format: RGB 5:5:5")); } #endif } else if (lpFormat->dwFourCC == BI_BITFIELDS) { if ((lpFormat->dwRGBBitCount != 16) || (lpFormat->dwRBitMask != 0xf800) || (lpFormat->dwGBitMask != 0x07e0) || (lpFormat->dwBBitMask != 0x001f)) { *lpFourcc = (DWORD) -1; } else { *lpBitCount = 16; DISPDBG((1,"Format: RGB 5:6:5")); } } else { lpFormat->dwRBitMask = (DWORD) -1; lpFormat->dwGBitMask = (DWORD) -1; lpFormat->dwBBitMask = (DWORD) -1; if (lpFormat->dwFourCC == FOURCC_PACKJR) { *lpBitCount = 8; DISPDBG((1, "Format: CLJR")); } else if (lpFormat->dwFourCC == FOURCC_YUY2) { *lpBitCount = 16; DISPDBG((1,"Format: YUY2")); } else { *lpBitCount = 16; DISPDBG((1,"Format: UYVY")); } } } else if (lpFormat->dwFlags & DDPF_RGB) { if (lpFormat->dwRGBBitCount == 8) { *lpFourcc = BI_RGB; DISPDBG((1, "Format: RGB 8")); } else if ((lpFormat->dwRGBBitCount == 16) && (lpFormat->dwRBitMask == 0xf800) && (lpFormat->dwGBitMask == 0x07e0) && (lpFormat->dwBBitMask == 0x001f)) { *lpFourcc = BI_BITFIELDS; DISPDBG((1,"Format: RGB 5:6:5")); } else if ((lpFormat->dwRGBBitCount == 16) && (lpFormat->dwRBitMask == 0x7C00) && (lpFormat->dwGBitMask == 0x03e0) && (lpFormat->dwBBitMask == 0x001f)) { *lpFourcc = BI_RGB; DISPDBG((1,"Format: RGB 5:5:5")); } else if (((lpFormat->dwRGBBitCount == 24) || (lpFormat->dwRGBBitCount == 32)) && (lpFormat->dwRBitMask == 0xff0000) && (lpFormat->dwGBitMask == 0x00ff00) && (lpFormat->dwBBitMask == 0x0000ff)) { *lpFourcc = BI_RGB; DISPDBG((1, "Format: RGB 8:8:8")); } else { *lpFourcc = (DWORD) -1; } *lpBitCount = (WORD) lpFormat->dwRGBBitCount; } else if (ppdev->cBitsPerPixel == 16) { *lpFourcc = BI_RGB; *lpBitCount = (WORD) lpFormat->dwRGBBitCount; } else { *lpFourcc = (DWORD) -1; } } /********************************************************** * * Name: RegInitVideo * * Module Abstract: * ---------------- * This function is called to program the video format and * the physicall offset of the video data in the frame buffer. * * Output Parameters: * ------------------ * none * *********************************************************** * Author: Shuhua Ge * Date: 09/24/96 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ VOID RegInitVideo(PDEV* ppdev, PDD_SURFACE_LOCAL lpSurface) { DWORD dwTemp; DWORD dwFourcc; LONG lPitch; LONG lLeft; WORD wTemp; WORD wBitCount = 0; RECTL rVideoRect; BYTE bRegCR31; BYTE bRegCR32; BYTE bRegCR33; BYTE bRegCR34; BYTE bRegCR35; BYTE bRegCR36; BYTE bRegCR37; BYTE bRegCR38; BYTE bRegCR39; BYTE bRegCR3A; BYTE bRegCR3B; BYTE bRegCR3C; BYTE bRegCR3D; BYTE bRegCR3E; BYTE bRegCR5C; BYTE bRegCR5D; BYTE bTemp; DWORD dwTemp1; BOOL bOverlayTooSmall = FALSE; BYTE* pjPorts = ppdev->pjPorts; /* * Determine the format of the video data */ if (lpSurface->dwFlags & DDRAWISURF_HASPIXELFORMAT) { GetFormatInfo(ppdev, &(lpSurface->lpGbl->ddpfSurface), &dwFourcc, &wBitCount); } else { // This needs to be changed when primary surface is RGB 5:6:5 dwFourcc = BI_RGB; wBitCount = (WORD) ppdev->cBitsPerPixel; } rVideoRect = ppdev->rOverlayDest; lPitch = lpSurface->lpGbl->lPitch; /* * Determine value in CR31 (Horizontal Zoom Code) */ if ((ppdev->rOverlayDest.right - ppdev->rOverlayDest.left) == (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left)) { /* * No zooming is occuring */ bRegCR31 = 0; } else { /* * The zoom code = (256 * ) / */ dwTemp = (DWORD) ((DWORD) (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left)) * 256; if (ppdev->bDoubleClock) { dwTemp <<= 1; } dwTemp1= (DWORD) (ppdev->rOverlayDest.right - ppdev->rOverlayDest.left); dwTemp= ((2 * dwTemp) + dwTemp1) / (2*dwTemp1); bRegCR31= (BYTE) dwTemp; } /* * Determine value in CR32 (Vertical Zoom Code) */ if ((ppdev->rOverlayDest.bottom - ppdev->rOverlayDest.top) == (ppdev->rOverlaySrc.bottom - ppdev->rOverlaySrc.top)) { /* * No zooming is occuring */ bRegCR32 = 0; } else { /* * The zoom code = (256 * ) / * The -1 is so that it won't mangle the last line by mixing it * with garbage data while Y interpolating. */ dwTemp = (DWORD) ((DWORD) ((ppdev->rOverlaySrc.bottom - 1) - ppdev->rOverlaySrc.top)) * 256; dwTemp /= (DWORD) (ppdev->rOverlayDest.bottom - ppdev->rOverlayDest.top); bRegCR32 = (BYTE) dwTemp; } /* * Determine value in CR33 (Region 1 Size) */ wTemp = (WORD) rVideoRect.left; if (ppdev->cBitsPerPixel == 8) { wTemp >>= 2; // 4 Pixels per DWORD } else if (ppdev->cBitsPerPixel == 16) { wTemp >>= 1; // 2 Pixels per DWORD } else if (ppdev->cBitsPerPixel == 24) { wTemp *= 3; wTemp /= 4; } bRegCR33 = (BYTE) wTemp; bRegCR36 = (BYTE) (WORD) (wTemp >> 8); /* * Determine value in CR34 (Region 2 size) */ wTemp = (WORD) (rVideoRect.right - rVideoRect.left); if (ppdev->cBitsPerPixel == 8) { wTemp >>= 2; // 4 Pixels per DWORD } else if (ppdev->cBitsPerPixel == 16) { wTemp >>= 1; // 2 Pixels per DWORD } else if (ppdev->cBitsPerPixel == 24) { wTemp *= 3; wTemp /= 4; } bRegCR34 = (BYTE) wTemp; wTemp >>= 6; bRegCR36 |= (BYTE) (wTemp & 0x0C); /* * Determine value in CR35 (Region 2 SDSize) */ dwTemp = (DWORD) (rVideoRect.right - rVideoRect.left); dwTemp *= (DWORD) (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left); dwTemp /= (DWORD) (ppdev->rOverlayDest.right - ppdev->rOverlayDest.left); wTemp = (WORD) dwTemp; if ((dwFourcc == FOURCC_PACKJR) || (wBitCount == 8)) { wTemp >>= 2; // 4 Pixels per DWORD } else { wTemp >>= 1; // 2 Pixels per DWORD } bRegCR35 = (BYTE) wTemp; wTemp >>= 4; bRegCR36 |= (BYTE) (wTemp & 0x30); // // Check double scan line counter feature // CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x17); bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); if (bTemp & 0x04) { // // Double scan line count // /* * Determine value in CR37 (Vertical Start) */ wTemp = (WORD) rVideoRect.top; bRegCR37 = (BYTE)(wTemp >> 1); if ( wTemp & 0x01 ) { wTemp >>= 9; bRegCR39 = (BYTE) wTemp | 0x10; // // Odd scan line trigger // Hardware has a bug now. // So reduce dest end by 1 // wTemp = (WORD) rVideoRect.bottom - 1 - 1; } else { wTemp >>= 9; bRegCR39 = (BYTE) wTemp; /* * Determine value in CR38 (Vertical End) */ wTemp = (WORD) rVideoRect.bottom - 1; } bRegCR38 = (BYTE)(wTemp >> 1); if (wTemp & 0x01) bRegCR39 |= 0x20; wTemp >>= 7; bRegCR39 |= (BYTE) (wTemp & 0x0C); } else { /* * Determine value in CR37 (Vertical Start) */ wTemp = (WORD) rVideoRect.top; bRegCR37 = (BYTE) wTemp; wTemp >>= 8; bRegCR39 = (BYTE) wTemp; /* * Determine value in CR38 (Vertical End) */ wTemp = (WORD) rVideoRect.bottom - 1; bRegCR38 = (BYTE) wTemp; wTemp >>= 6; bRegCR39 |= (BYTE) (wTemp & 0x0C); } /* * Determine values in CR3A, CR3B, CR3C (Start Address) */ dwTemp = 0; if (bRegCR31 != 0) { // // overlay is zoomed, re-initialize zoom factor // CalculateStretchCode(ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left, ppdev->rOverlayDest.right - ppdev->rOverlayDest.left, ppdev->HorStretchCode); } // // Here, we want to ensure the source rectangle's clipped width is bigger // than what the HW can support, sigh! // if (!bOverlayTooSmall) { LONG lSrcPels; // // compute non-clip amount on right edge // lSrcPels = rVideoRect.right - rVideoRect.left; if (bRegCR31 != 0) // source is zoomed if non-zero { WORD wRightCnt; wRightCnt = 0; while (lSrcPels > 0) { lSrcPels -= ppdev->HorStretchCode[wRightCnt]; if (lSrcPels >= 0) { wRightCnt++; } } lSrcPels = (LONG)wRightCnt; } if ((lSrcPels == 0) || (lSrcPels <= MIN_OLAY_WIDTH)) { bOverlayTooSmall = TRUE; } } lLeft = ppdev->rOverlaySrc.left; if (dwFourcc == FOURCC_PACKJR) { lLeft &= ~0x03; } else if (dwFourcc == FOURCC_YUV422 || dwFourcc == FOURCC_YUY2 ) { lLeft &= ~0x01; } // // dwTemp has adjusted dest. rect., add in source adjustment // dwTemp += (ppdev->rOverlaySrc.top * lPitch) + ((lLeft * wBitCount) >>3); ppdev->sOverlay1.lAdjustSource = dwTemp; // dwTemp += ((BYTE*)lpSurface->lpGbl->fpVidMem - ppdev->pjScreen); // sss dwTemp += (DWORD)(lpSurface->lpGbl->fpVidMem); bRegCR5D = (BYTE) ((dwTemp << 2) & 0x0C); dwTemp >>= 2; bRegCR3A = (BYTE) dwTemp & 0xfe; // Align to even byte (5446 bug) dwTemp >>= 8; bRegCR3B = (BYTE) dwTemp; dwTemp >>= 8; bRegCR3C = (BYTE) (dwTemp & 0x0f); /* * Determine value in CR3D (Address Offset/Pitch) */ wTemp = (WORD) (lPitch >> 3); if (lpSurface->dwReserved1 & OVERLAY_FLG_DECIMATE) { wTemp >>= 1; } bRegCR3D = (BYTE) wTemp; wTemp >>= 3; bRegCR3C |= (BYTE) (wTemp & 0x20); /* * Determine value in CR3E (Master Control Register) */ bRegCR3E = 0; if (lpSurface->dwReserved1 & OVERLAY_FLG_ENABLED) { bRegCR3E = 0x01; } if (dwFourcc == FOURCC_PACKJR) { bRegCR3E |= 0x20; // Always error difuse when using PackJR } if ((bRegCR32 == 0) || MustLineReplicate (ppdev, lpSurface, wBitCount)) { bRegCR3E |= 0x10; lpSurface->dwReserved1 &= ~OVERLAY_FLG_INTERPOLATE; } else { lpSurface->dwReserved1 |= OVERLAY_FLG_INTERPOLATE; } if (dwFourcc == FOURCC_PACKJR) { bRegCR3E |= 0x02; } else if (dwFourcc == BI_RGB) { if (wBitCount == 16) { bRegCR3E |= 0x08; } else if (wBitCount == 8) { bRegCR3E |= 0x04; } } else if (dwFourcc == BI_BITFIELDS) { bRegCR3E |= 0x0A; } /* * If we are color keying, we will set that up now */ if (lpSurface->dwReserved1 & OVERLAY_FLG_COLOR_KEY) { bRegCR3E |= 0x80; CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a); bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Set CR1A[3:2] to timing ANDed w/ color bTemp &= ~0x0C; CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp); CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1d); // Clear CR1D[5:4] bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); if (ppdev->cBitsPerPixel == 8) { CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x38); CP_OUT_WORD(pjPorts, INDEX_REG, (ppdev->wColorKey << 8) | 0x0c); // Output color to GRC CP_OUT_WORD(pjPorts, INDEX_REG, 0x0d); // Output color to GRD } else { CP_OUT_BYTE(pjPorts, CRTC_DATA, (bTemp & ~0x30) | 0x08); CP_OUT_WORD(pjPorts, INDEX_REG, (ppdev->wColorKey << 8) | 0x0c); // Output color to GRC CP_OUT_WORD(pjPorts, INDEX_REG, (ppdev->wColorKey & 0xff00) | 0x0d);// Output color to GRD } } else if (lpSurface->dwReserved1 & OVERLAY_FLG_SRC_COLOR_KEY) { BYTE bYMax, bYMin, bUMax, bUMin, bVMax, bVMin; bRegCR3E |= 0x80; CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a); bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Set CR1A[3:2] to timing ANDed w/ color bTemp &= ~0x0C; CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp); CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1d); // Set CR1D[5:4] to 10 CP_OUT_BYTE(pjPorts, CRTC_DATA, CP_IN_BYTE(pjPorts, CRTC_DATA) | 0x20); /* * Determine min/max values */ if ((dwFourcc == FOURCC_YUV422) || (dwFourcc == FOURCC_YUY2) || (dwFourcc == FOURCC_PACKJR)) { bYMax = (BYTE)(DWORD)(ppdev->dwSrcColorKeyHigh >> 16); bYMin = (BYTE)(DWORD)(ppdev->dwSrcColorKeyLow >> 16); bUMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 8) & 0xff); bUMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 8) & 0xff); bVMax = (BYTE)(ppdev->dwSrcColorKeyHigh & 0xff); bVMin = (BYTE)(ppdev->dwSrcColorKeyLow & 0xff); if (dwFourcc == FOURCC_PACKJR) { bYMax |= 0x07; bUMax |= 0x03; bVMax |= 0x03; bYMin &= ~0x07; bUMin &= ~0x03; bVMin &= ~0x03; } } else if ((dwFourcc == 0) && (wBitCount == 16)) { /* * RGB 5:5:5 */ bYMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 7) & 0xF8); bYMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 7) & 0xF8); bUMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 2) & 0xF8); bUMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 2) & 0xF8); bVMax = (BYTE)(ppdev->dwSrcColorKeyHigh << 3); bVMin = (BYTE)(ppdev->dwSrcColorKeyLow << 3); bYMax |= 0x07; bUMax |= 0x07; bVMax |= 0x07; } else if (dwFourcc == BI_BITFIELDS) { /* * RGB 5:6:5 */ bYMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 8) & 0xF8); bYMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 8) & 0xF8); bUMax = (BYTE)(DWORD)((ppdev->dwSrcColorKeyHigh >> 3) & 0xFC); bUMin = (BYTE)(DWORD)((ppdev->dwSrcColorKeyLow >> 3) & 0xFC); bVMax = (BYTE)(ppdev->dwSrcColorKeyHigh << 3); bVMin = (BYTE)(ppdev->dwSrcColorKeyLow << 3); bYMax |= 0x07; bUMax |= 0x03; bVMax |= 0x07; } CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bYMin << 8) | 0x0C); // GRC CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bYMax << 8) | 0x0D); // GRD CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bUMin << 8) | 0x1C); // GR1C CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bUMax << 8) | 0x1D); // GR1D CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bVMin << 8) | 0x1E); // GR1E CP_OUT_WORD(pjPorts, INDEX_REG, ((WORD)bVMax << 8) | 0x1F); // GR1F } else { CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a); bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); // Clear CR1A[3:2] CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x0C); } /* * Set up alignment info */ if (ppdev->cBitsPerPixel != 24) { WORD wXAlign; WORD wXSize; if (ppdev->cBitsPerPixel == 8) { wXAlign = (WORD)rVideoRect.left & 0x03; wXSize = (WORD)(rVideoRect.right - rVideoRect.left) & 0x03; } else { wXAlign = (WORD)(rVideoRect.left & 0x01) << 1; wXSize = (WORD)((rVideoRect.right - rVideoRect.left) & 0x01) << 1; } bRegCR5D |= (BYTE) (wXAlign | (wXSize << 4)); } else { bRegCR5D = 0; } /* * Set up the FIFO threshold value. Make sure that the value we use is * not less than the default value. */ CP_OUT_BYTE(pjPorts, SR_INDEX, 0x16); bTemp = CP_IN_BYTE(pjPorts, SR_DATA) & 0x0f; if (bTemp > (ppdev->lFifoThresh & 0x0f)) { ppdev->lFifoThresh = bTemp; } if (ppdev->lFifoThresh < 0x0f) { ppdev->lFifoThresh++; // Eliminates possible errata } bRegCR5C = 0x10 | ((BYTE) ppdev->lFifoThresh & 0x0f); /* * Now start programming the registers */ CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR31 << 8) | 0x31); // CR31 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR32 << 8) | 0x32); // CR32 if (lpSurface->dwReserved1 & OVERLAY_FLG_YUVPLANAR) { CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) 0x10 << 8) | 0x3F); // CR3F } CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR5C << 8) | 0x5C); // CR5C // // disable overlay if overlay is too small to be supported by HW // if (bOverlayTooSmall) { bRegCR3E &= ~0x01; // disable overlay ppdev->dwPanningFlag |= OVERLAY_OLAY_REENABLE; // totally clipped } else { CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR33 << 8) | 0x33); // CR33 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR34 << 8) | 0x34); // CR34 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR35 << 8) | 0x35); // CR35 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR36 << 8) | 0x36); // CR36 // CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR37 << 8) | 0x37); // CR37 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR38 << 8) | 0x38); // CR38 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR39 << 8) | 0x39); // CR39 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3A << 8) | 0x3A); // CR3A CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3B << 8) | 0x3B); // CR3B CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3C << 8) | 0x3C); // CR3C CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3D << 8) | 0x3D); // CR3D CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR5D << 8) | 0x5D); // CR5D // // Write Vertical start first // CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR37 << 8) | 0x37); // CR37 } CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3E << 8) | 0x3E); // CR3E } /********************************************************** * Name: DisableOverlay_544x * * Module Abstract: * ---------------- * This is called when an overlay window is totally clipped by * the panning viewport. **********************************************************/ VOID DisableOverlay_544x(PDEV* ppdev) { WORD wCR3E; BYTE* pjPorts = ppdev->pjPorts; ppdev->dwPanningFlag |= OVERLAY_OLAY_REENABLE; CP_OUT_BYTE(pjPorts, CRTC_INDEX,0x3e); //Video Window Master Control wCR3E = CP_IN_WORD(pjPorts, CRTC_INDEX) & ~0x100; //clear bit one CP_OUT_WORD(pjPorts, CRTC_INDEX, wCR3E); //disable overlay window } /********************************************************** * Name: EnableOverlay_544x * * Module Abstract: * ---------------- * Show the overlay window. **********************************************************/ VOID EnableOverlay_544x(PDEV* ppdev) { WORD wCR3E; BYTE* pjPorts = ppdev->pjPorts; ppdev->dwPanningFlag &= ~OVERLAY_OLAY_REENABLE; CP_OUT_BYTE(pjPorts, CRTC_INDEX,0x3e); //Video Window Master Control wCR3E = CP_IN_WORD(pjPorts, CRTC_INDEX) | 0x100; //clear bit one CP_OUT_WORD(pjPorts, CRTC_INDEX, wCR3E); //disable overlay window } /********************************************************** * * Name: ClearAltFIFOThreshold_544x * * Module Abstract: * ---------------- * * * Output Parameters: * ------------------ * none * *********************************************************** * Author: Shuhua Ge * Date: 02/03/97 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ VOID ClearAltFIFOThreshold_544x(PDEV * ppdev) { UCHAR bTemp; BYTE* pjPorts = ppdev->pjPorts; DISPDBG((1, "ClearAltFIFOThreshold")); CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x5c); // Clear Alt FIFO Threshold bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); CP_OUT_BYTE(pjPorts, CRTC_DATA, bTemp & ~0x10); } /********************************************************** * * Name: RegMoveVideo * * Module Abstract: * ---------------- * This function is called to move the video window that has * already been programed. * * Output Parameters: * ------------------ * none * *********************************************************** * Author: Shuhua Ge * Date: 09/25/96 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ VOID RegMoveVideo(PDEV* ppdev, PDD_SURFACE_LOCAL lpSurface) { BOOL bZoomX; DWORD dwTemp; DWORD dwFourcc; LONG lLeft; LONG lPitch; WORD wTemp; WORD wBitCount = 0; RECTL rVideoRect; BYTE bRegCR33; BYTE bRegCR34; BYTE bRegCR35; BYTE bRegCR36; BYTE bRegCR37; BYTE bRegCR38; BYTE bRegCR39; BYTE bRegCR3A; BYTE bRegCR3B; BYTE bRegCR3C; BYTE bRegCR3D; BYTE bRegCR5D; BYTE bTemp; BYTE* pjPorts = ppdev->pjPorts; /* * Determine the format of the video data */ if (lpSurface->dwFlags & DDRAWISURF_HASPIXELFORMAT) { GetFormatInfo(ppdev, &(lpSurface->lpGbl->ddpfSurface), &dwFourcc, &wBitCount); } else { // This needs to be changed when primary surface is RGB 5:6:5 dwFourcc = BI_RGB; wBitCount = (WORD) ppdev->cBitsPerPixel; } rVideoRect = ppdev->rOverlayDest; // // rVideoRect is now adjusted and clipped to the panning viewport. // Disable overlay if totally clipped by viewport. // if (((rVideoRect.right - rVideoRect.left) <= 0) || ((rVideoRect.bottom- rVideoRect.top ) <= 0)) { DisableOverlay_544x(ppdev); // #ew1 cannot display below min. overlay size return; } lPitch = lpSurface->lpGbl->lPitch; /* * Determine value in CR33 (Region 1 Size) */ wTemp = (WORD) rVideoRect.left; if (ppdev->cBitsPerPixel == 8) { wTemp >>= 2; // 4 Pixels per DWORD } else if (ppdev->cBitsPerPixel == 16) { wTemp >>= 1; // 2 Pixels per DWORD } else if (ppdev->cBitsPerPixel == 24) { wTemp *= 3; wTemp /= 4; } bRegCR33 = (BYTE) wTemp; bRegCR36 = (BYTE) (WORD) (wTemp >> 8); /* * Determine value in CR34 (Region 2 size) */ wTemp = (WORD) (rVideoRect.right - rVideoRect.left); if (ppdev->cBitsPerPixel == 8) { wTemp >>= 2; // 4 Pixels per DWORD } else if (ppdev->cBitsPerPixel == 16) { wTemp >>= 1; // 2 Pixels per DWORD } else if (ppdev->cBitsPerPixel == 24) { wTemp *= 3; wTemp /= 4; } bRegCR34 = (BYTE) wTemp; wTemp >>= 6; bRegCR36 |= (BYTE) (wTemp & 0x0C); /* * Determine value in CR35 (Region 2SD Size) */ dwTemp = (DWORD) (rVideoRect.right - rVideoRect.left); dwTemp *= (DWORD) (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left); dwTemp /= (DWORD) (ppdev->rOverlayDest.right - ppdev->rOverlayDest.left); wTemp = (WORD) dwTemp; if ((dwFourcc == FOURCC_PACKJR) || (wBitCount == 8)) { wTemp >>= 2; // 4 Pixels per DWORD } else { wTemp >>= 1; // 2 Pixels per DWORD } bRegCR35 = (BYTE) wTemp; wTemp >>= 4; bRegCR36 |= (BYTE) (wTemp & 0x30); // // Check double scan line counter feature // CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x17); bTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); if (bTemp & 0x04) { // // Double scan line count // /* * Determine value in CR37 (Vertical Start) */ wTemp = (WORD) rVideoRect.top; bRegCR37 = (BYTE)(wTemp >> 1); if ( wTemp & 0x01 ) { wTemp >>= 9; bRegCR39 = (BYTE) wTemp | 0x10; // // Odd scan line trigger // Hardware has a bug now. // So reduce dest end by 1 // wTemp = (WORD) rVideoRect.bottom - 1 - 1; } else { wTemp >>= 9; bRegCR39 = (BYTE) wTemp; /* * Determine value in CR38 (Vertical End) */ wTemp = (WORD) rVideoRect.bottom - 1; } bRegCR38 = (BYTE)(wTemp >> 1); if (wTemp & 0x01) bRegCR39 |= 0x20; wTemp >>= 7; bRegCR39 |= (BYTE) (wTemp & 0x0C); } else { /* * Determine value in CR37 (Vertical Start) */ wTemp = (WORD) rVideoRect.top; //if (ppdev->bDoubleClock) //{ // wTemp >>= 1; //} bRegCR37 = (BYTE) wTemp; wTemp >>= 8; bRegCR39 = (BYTE) wTemp; /* * Determine value in CR38 (Vertical End) */ wTemp = (WORD) rVideoRect.bottom - 1; //if (ppdev->bDoubleClock) //{ // wTemp >>= 1; //} bRegCR38 = (BYTE) wTemp; wTemp >>= 6; bRegCR39 |= (BYTE) (wTemp & 0x0C); } /* * Determine values in CR3A, CR3B, CR3C (Start Address) */ dwTemp = 0; bZoomX = ((ppdev->rOverlayDest.right - ppdev->rOverlayDest.left) != (ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left)); if (bZoomX) { // // overlay is zoomed, re-initialize zoom factor // CalculateStretchCode(ppdev->rOverlaySrc.right - ppdev->rOverlaySrc.left, ppdev->rOverlayDest.right - ppdev->rOverlayDest.left, ppdev->HorStretchCode); } // // Here, we want to ensure the source rectangle's clipped width is bigger // than what the HW can support, sigh! // // if (grOverlayDest.right > sData->rViewport.right) { int iSrcPels; // // compute non-clip amount on right edge // iSrcPels = (int)(rVideoRect.right - rVideoRect.left); if (bZoomX) { WORD wRightCnt; wRightCnt = 0; while (iSrcPels > 0) { iSrcPels -= ppdev->HorStretchCode[wRightCnt]; if (iSrcPels >= 0) { wRightCnt++; } } iSrcPels = (int)wRightCnt; } if ((iSrcPels == 0) || (iSrcPels <= MIN_OLAY_WIDTH)) { DisableOverlay_544x(ppdev); // cannot display below min. overlay size return; } } lLeft = ppdev->rOverlaySrc.left; if (dwFourcc == FOURCC_PACKJR) { lLeft &= ~0x03; } else if (dwFourcc == FOURCC_YUV422 || dwFourcc == FOURCC_YUY2) { lLeft &= ~0x01; } // // #ew1 dwTemp has adjusted dest. rect., add in source adjustment // dwTemp += (ppdev->rOverlaySrc.top * lPitch) + ((lLeft * wBitCount) >>3); ppdev->sOverlay1.lAdjustSource = dwTemp; // dwTemp += ((BYTE*)lpSurface->lpGbl->fpVidMem - ppdev->pjScreen); // sss dwTemp += (DWORD)(lpSurface->lpGbl->fpVidMem); bRegCR5D = (BYTE) ((dwTemp << 2) & 0x0C); dwTemp >>= 2; bRegCR3A = (BYTE) dwTemp & 0xfe; // Align to even byte (5446 bug) dwTemp >>= 8; bRegCR3B = (BYTE) dwTemp; dwTemp >>= 8; bRegCR3C = (BYTE) (dwTemp & 0x0f); /* * Determine value in CR3D (Address Offset/Pitch) */ wTemp = (WORD) (lPitch >> 3); if (lpSurface->dwReserved1 & OVERLAY_FLG_DECIMATE) { wTemp >>= 1; } bRegCR3D = (BYTE) wTemp; wTemp >>= 3; bRegCR3C |= (BYTE) (wTemp & 0x20); /* * Set up alignment info */ if (ppdev->cBitsPerPixel != 24) { WORD wXAlign; WORD wXSize; if (ppdev->cBitsPerPixel == 8) { wXAlign = (WORD)rVideoRect.left & 0x03; wXSize = (WORD)(rVideoRect.right - rVideoRect.left) & 0x03; } else { wXAlign = (WORD)(rVideoRect.left & 0x01) << 1; wXSize = (WORD)((rVideoRect.right - rVideoRect.left) & 0x01) << 1; } bRegCR5D |= (BYTE) (wXAlign | (wXSize << 4)); } /* * Now we will write the actual register values. */ CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR33 << 8) | 0x33); // CR33 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR34 << 8) | 0x34); // CR34 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR35 << 8) | 0x35); // CR35 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR36 << 8) | 0x36); // CR36 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR38 << 8) | 0x38); // CR38 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR39 << 8) | 0x39); // CR39 CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3A << 8) | 0x3A); // CR3A CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3B << 8) | 0x3B); // CR3B CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3C << 8) | 0x3C); // CR3C CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR3D << 8) | 0x3D); // CR3D CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR5D << 8) | 0x5D); // CR5D CP_OUT_WORD(pjPorts, CRTC_INDEX, ((WORD) bRegCR37 << 8) | 0x37); // CR37 if (ppdev->dwPanningFlag & OVERLAY_OLAY_REENABLE) EnableOverlay_544x(ppdev); } /********************************************************** * * Name: CalculateStretchCode * * Module Abstract: * ---------------- * This code was originally written by Intel and distributed * with the DCI development kit. * * This function takes the zoom factor and determines exactly * how many times we need to replicate each row/column. * * Output Parameters: * ------------------ * none * *********************************************************** * Author: Intel * Date: ??/??/?? * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * Scott MacDonald 10/06/94 Incorporated code into DCI provider. * *********************************************************/ VOID CalculateStretchCode (LONG srcLength, LONG dstLength, LPBYTE code) { LONG dwDeltaX, dwDeltaY, dwConst1, dwConst2, dwP; LONG i, j, k; BYTE bStretchIndex = 0; LONG total = 0; /* * for some strange reason I'd like to figure out but haven't got time to, the * replication code generation seems to have a problem between 1:1 and 2:1 stretch * ratios. Fix is to zero-initialize index (the problem occurs in the first one * generated) when stretch is betw. those ratios, and one-initialize it otherwise. */ if ((dstLength <= srcLength * 2L) && (dstLength >= srcLength)) { bStretchIndex = 0; } else { bStretchIndex = 1; } /* * initialize code array, to get rid of anything which might have been * left over in it. */ for (i = 0; i < srcLength; i++) { code[i] = 0; } /* * Variable names roughly represent what you will find in any graphics * text. Consult text for an explanation of Bresenham line alg., it's * beyond the scope of my comments here. */ dwDeltaX = srcLength; dwDeltaY = dstLength; if (dstLength < srcLength) { /* * Size is shrinking, use standard Bresenham alg. */ dwConst1 = 2L * dwDeltaY; dwConst2 = 2L * (dwDeltaY - dwDeltaX); dwP = 2L * dwDeltaY - dwDeltaX; for (i = 0; i < dwDeltaX; i++) { if (dwP <= 0L) { dwP += dwConst1; } else { dwP += dwConst2; code[i]++; total++; } } } else { /* * Size is increasing. Use Bresenham adapted for slope > 1, and * use a loop invariant to generate code array. Run index i from * 0 to dwDeltaY - 1, and when i = dwDeltaY - 1, j will * be = dwDeltaX - 1. */ dwConst1 = 2L * dwDeltaX; dwConst2 = 2L * (dwDeltaX - dwDeltaY); dwP = 2L * dwDeltaX - dwDeltaY; j = 0; for (i = 0; i < dwDeltaY; i++) { if (dwP <= 0L) { dwP += dwConst1; bStretchIndex++; } else { dwP += dwConst2; code[j++] = ++bStretchIndex; bStretchIndex = 0; total += (int)code[j - 1]; } } /* * UGLY fix up for wacky bug which I have no time to fix properly. * The 'total' of entries is messed up for slopes > 4, so add the * difference back into the array. */ if (total < dwDeltaY) { while (total < dwDeltaY) { j = (int)dwDeltaY - total; k = (int)dwDeltaY / j; for (i = 0; i < dwDeltaX; i++) { if (!(i % k) && (total < dwDeltaY)) { code[i]++; total++; } } } } } } /********************************************************** * * Name: GetThresholdValue * * Module Abstract: * ---------------- * Determines the best threshold for the specified * surface. * * Output Parameters: * ------------------ * Threshold * *********************************************************** * Author: Shuhua Ge * Date: 09/25/95 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ BYTE GetThresholdValue(VOID) { return ((BYTE) 0x0A); } /********************************************************** * * Name: MustLineRelicate * * Module Abstract: * ---------------- * Checks to see if we must line replicate or if we can * interpolate. * * Output Parameters: * ------------------ * TRUE/FALSE * *********************************************************** * Author: Shuhua Ge * Date: 09/25/96 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ BOOL MustLineReplicate (PDEV* ppdev, PDD_SURFACE_LOCAL lpSurface, WORD wVideoDepth) { LONG lTempThresh; /* * If we are double clocking the data (1280x1024 mode), we must * replicate. We should also always replicate in Performance mode */ if (ppdev->bDoubleClock) { return (TRUE); } // // Check the VCLK // // sge07 if (GetVCLK(ppdev) > 130000) { return (TRUE); } /* * If we are using the chroma key feature, we can't interpolate */ if (lpSurface->dwReserved1 & (OVERLAY_FLG_COLOR_KEY | OVERLAY_FLG_SRC_COLOR_KEY)) { return (TRUE); } lTempThresh = ppdev->lFifoThresh; if (ppdev->pfnIsSufficientBandwidth(ppdev, wVideoDepth, &ppdev->rOverlaySrc, &ppdev->rOverlayDest, OVERLAY_FLG_INTERPOLATE)) { ppdev->lFifoThresh = lTempThresh; return (FALSE); } ppdev->lFifoThresh = lTempThresh; return (TRUE); } /********************************************************** * * Name: IsSufficientBandwidth * * Module Abstract: * ---------------- * Determines is sufficient bandwidth exists for the requested * configuration. * * Output Parameters: * ------------------ * TRUE/FALSE * It also sets the global parameter lFifoThresh, which gets * programed in RegInitVideo(). * *********************************************************** * Author: Shuhua Ge * Date: 09/25/96 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ BOOL IsSufficientBandwidth(PDEV* ppdev, WORD wVideoDepth, LPRECTL lpSrc, LPRECTL lpDest, DWORD dwFlags) { LONG lVideoPixelsPerDWORD; LONG lGraphicsPixelsPerDWORD; LONG lVCLKPeriod; LONG lTransferTime; LONG lDWORDsWritten; LONG lZoom; LONG lReadPeriod; LONG lEffReadPeriod; LONG lWritePeriod; LONG lEffWritePeriod; LONG K1,K2; LONG lTrFifoAFirst4; LONG lTrFifoB2; LONG lDWORDsRead; LONG lFifoAReadPeriod; LONG lFifoBReadPeriod; LONG lFifoAEffWritePeriod; LONG lFifoBEffWritePeriod; LONG lFifoALevels; LONG lFifoBLevels; LONG lFifoAThresh; LONG lFifoBThresh; LONG lVCLK; BYTE* pjPorts = ppdev->pjPorts; //#define BLIT_LATENCY 8 #define CRT_FIFO_DEPTH 28 // // Add 8 clock for BLT_LATENCY for 54446BE and later chips // // sge04 LONG BLIT_LATENCY = 8; if (ppdev->flCaps & CAPS_SECOND_APERTURE) BLIT_LATENCY += 2; /* * Convert input parameters */ if (wVideoDepth == 16) { lVideoPixelsPerDWORD = 2; } else { lVideoPixelsPerDWORD = 4; } if (ppdev->cBitsPerPixel == 8) { lGraphicsPixelsPerDWORD = 4; } else if (ppdev->cBitsPerPixel == 16) { lGraphicsPixelsPerDWORD = 2; } else if (ppdev->cBitsPerPixel == 24) { lGraphicsPixelsPerDWORD = 1; } else return (FALSE); lZoom = ((lpDest->right - lpDest->left) * 256) / (lpSrc->right - lpSrc->left); /* * If we are double clocked, fail if we are not zoomed at least 2X */ if (ppdev->bDoubleClock && (lZoom < 512)) { return (FALSE); } /* * We need to get the VCLK every time since this can change * at run-time */ lVCLK = GetVCLK(ppdev); if (lVCLK == 0) { return (FALSE); } lVCLKPeriod = (LONG) ((1000000/lVCLK) + 1); /* * We only need to setup the following variables once! */ if (!ppdev->lBusWidth) { /* * We will read the bus width from SR0F[4:3] */ CP_OUT_BYTE(pjPorts, SR_INDEX, 0x0F); if ((CP_IN_BYTE(pjPorts, SR_DATA) & 0x18) == 0x18) { ppdev->lBusWidth = 8; // 64 bit bus } else { ppdev->lBusWidth = 4; // 32 bit bus } } if (!ppdev->lRandom) { /* * Is this EDO or regular? */ CP_OUT_BYTE(pjPorts, SR_INDEX, 0x0f); if (!(CP_IN_BYTE(pjPorts, SR_DATA) & 0x4)) { ppdev->lRandom = 7; ppdev->lPageMiss = 7; } else { ppdev->lRandom = 6; ppdev->lPageMiss = 6; } } if (!ppdev->lMCLKPeriod) { LONG lMCLK; /* * The MCLK period is the amount of time required for one cycle. * We will round up. */ CP_OUT_BYTE(pjPorts, SR_INDEX, 0x1f); // First get the MCLK frequency lMCLK = CP_IN_BYTE(pjPorts, SR_DATA); lMCLK *= 14318; lMCLK >>= 3; ppdev->lMCLKPeriod = ((1000000/lMCLK) + 1); } /* * Check for the case with no color key or Y interpolation */ if (dwFlags == 0) { /* * This mode utilizes only FIFO A. The fifo is filled with * graphics data during regions 1 and 3, and video data during * region 2. * * The normal memory sequence for this mode goes as follows. * * ------------------------------------------------ * | cpu/blit cycle | FIFO A fill | cpu/blit cycle .... * ------------------------------------------------ * * The cpu/blit cycle is interrupted when the CRT * fifo is depleted to its threshold. Once the * crt cycle is started, it continues until the * FIFO A is full. * * Worst case condition for filling the CRT fifo : * * 1) CPU/blit latency -> * 2) Random cycle for region 2 video -> * 3) Page miss for region 2 video -> * 4) Page miss for region 2 to region 3 transition -> * 5) Page miss for region 3 graphics * * Conditions 3 and 5 depend on the location of the * graphic screen within display memory. For 1024x768, where * the graphics screen starts at location 0 and is offset by * 1024 or 2048 bytes each line, condition 5 is never met. * If a video window starts at beginning of a memory page, * and is offset at the beggining of each line by an even * multiple of a memory page, condition 3 is never met. * * Based on this worst case condition, the amount of time * required to complete 4 transfers into the crt fifo * is approximately: * lTransferTime = (BLIT_LATENCY + lRandom + 3*(lPageMiss)) * * lMCLKPeriod. * the number of dwords transferred to the fifo * during this time is 4 for 32 bit memory interface * or 8 for 64 bit interface. * lDWORDsWritten = 4 * (lBusWidth/4) * * During this period, data continues to be read from the crt * fifo for screen refresh. The amount of data read, * assuming a 1x scale is approximately: * lDWORDsRead = tr_time/(lVideoPixelsPerDWORD * lVCLKPeriod) * * The difference between the dwords read and dwords * written must be accounted for in the fifo trheshold setting * * lFifoThresh = (lDWORDsRead - lDWORDsWritten) rounded * up to next even value. * * To determine if there is adequate bandwidth to support * the mode, the lFifoThresh must not exceed the fifo depth. * For the mode to work, the fifo read rate must not exceed the * fifo write rate. * read_rate = min(lGraphicsPixelsPerDWORD,lVideoPixelsPerDWORD) * lVCLKPeriod. * write_rate = lMCLKPeriod * 2; -- 2 clocks per cas * * A special case occurs if the fifo read rate is very close to the peak * fifo write rate. In this case the crt fill may result in a continuous * page cycle for the entire active line. This could result in 1 extra * page miss at the start of region2. To account for this, I will * add 3 DWORDS to the trheshold if the read and write rates are very close * (arbitrarily defined as within 10% of each other. * * Zooming * Some modes can only be supported at video scale factors greater than 1X. * Even when the video is zoomed, a small number of dwords must be read * from the crt fifo at the unzoomed rate in order to prime the video * pipeline. The video pipeline requires 10 pixel before it slows the fifo * reads to the zoomed rate. * * tr_time - (lVCLKPeriod * 10/lVideoPixelsPerDWORD) * lDWORDsRead = --------------------------------------------- + 10/lVideoPixelsPerDWORDord * (lVideoPixelsPerDWORD * lVCLKPeriod * lZoom) */ lTransferTime = (BLIT_LATENCY + ppdev->lRandom + (3*(ppdev->lPageMiss))) * ppdev->lMCLKPeriod; lDWORDsWritten = 3 * (ppdev->lBusWidth/4); /* * If read rate exceeds write rate, calculate minumum zoom * to keep everything as ints, spec the zoom as 256 times * the fractional zoom */ lWritePeriod = ppdev->lMCLKPeriod * 2/(ppdev->lBusWidth/4); lReadPeriod = lVideoPixelsPerDWORD * lVCLKPeriod; /* * Pick worst case of graphics and video depths for calculation * of dwords read. This may be a little pessimistic for the * when the graphics bits per pixel exceeds the video bits per pixel. */ lEffReadPeriod = (lVideoPixelsPerDWORD * lVCLKPeriod * lZoom)/256; if (lEffReadPeriod < lWritePeriod) { /* * Cannot support overlay at this zoom factor */ return (0); } if (lGraphicsPixelsPerDWORD > lVideoPixelsPerDWORD) // handle zoom factor { lDWORDsRead = ((lTransferTime - (lVCLKPeriod * 10/lVideoPixelsPerDWORD))/ (lEffReadPeriod)) + (10 / lVideoPixelsPerDWORD) + 1; } else { lDWORDsRead = (lTransferTime/ (lGraphicsPixelsPerDWORD * lVCLKPeriod)) + 1; } // Calculate the fifo threshold setting ppdev->lFifoThresh = lDWORDsRead - lDWORDsWritten; // if read rate is within 10% of write rate, up by 3 dwords if ((11*lEffReadPeriod) < ((10*lWritePeriod*256)/lZoom)) { ppdev->lFifoThresh += 3; } // fifo trheshold spec'd in QWORDS, so round up by 1 and divide by 2) ppdev->lFifoThresh = (ppdev->lFifoThresh + 1)/2; // Add a extra QWORD to account for fifo level sync logic ppdev->lFifoThresh = ppdev->lFifoThresh + 1; if (ppdev->bDoubleClock) { ppdev->lFifoThresh <<= 1; } if ((ppdev->lFifoThresh >= CRT_FIFO_DEPTH) || ((lEffReadPeriod) < lWritePeriod)) { return (0); } else { return (1); } } /* * Check bandwidth for Y Interpolation */ else if (dwFlags & OVERLAY_FLG_INTERPOLATE) { /* * This mode utilizes both FIFOs A and B. During horizontal blank, * both fifos are filled. FIFO a is then filled with graphics * data during regions 1 and 3, and video data during region 2. * FIFO B is filled with video data during region 2, and is idle * during regions 1 and 3. * * The normal memory sequence for this mode goes as follows. * * ---------------------------------------------------------------- * | cpu/blit cycle | FIFO A fill | FIFO B fill | cpu/blit cycle . * ---------------------------------------------------------------- * or * ---------------------------------------------------------------- * | cpu/blit cycle | FIFO B fill | FIFO A fill | cpu/blit cycle . * ---------------------------------------------------------------- * * For this mode, the FIFO threshold must be set high enough to allow * enough time to abort the cpu/blt, fill FIFO A, then transfer data * into FIFO B before underflow occurs. * * Worst case condition for filling the CRT fifo : * * 1) CPU/blit latency -> * 2) FIFO A random cycle for region 2 video -> * 3) FIFO A page miss for region 2 video -> * 4) FIFO A page miss for region 2 to region 3 transition -> * 5) FIFO A page miss for region 3 graphics * 6) FIFO A page mode fill * 7) FIFO B random cycle * 8) FIFO B page miss * * lTransferTime = lMCLKPeriod * * (BLIT_LATENCY + lRandom + 3*(lPageMiss) + * fifoa_remaining + * lRandom + lPageMiss; * * * The time required to fill FIFO A depends upon the read rate * of FIFO A and the number of levels that must be filled, * as determined by the threshold setting. * * The worst case fill time for the first four levels of fifo A is * lTrFifoAFirst4 = (BLIT_LATENCY + lRandom + 3*(lPageMiss)) * * lMCLKPeriod; * * The number of dwords depleted from fifo A during the * fill of the first four levels is * lReadPeriod = lVCLKPeriod * lVideoPixelsPerDWORD * lZoom; * fifoa_reads_4 = lTrFifoAFirst4/lReadPeriod; * * The number of empty levels remaining in the fifo after * the fill of the first four levels is * fifoa_remaining = FIFO_DEPTH - lFifoThresh + ((4*ramwidth)/4) * - lTrFifoAFirst4/lReadPeriod; * * The amount of time required to fill the remaining levels of * fifo A is determined by the write rate and the read rate. * lWritePeriod = lMCLKPeriod * 2; // 2 clks per cas * lEffWritePeriod = ((lReadPeriod * lWritePeriod)/ * (lReadPeriod - lWritePeriod)); * * tr_fifoa_remaining = fifoa_remaining * lEffWritePeriod; * * * The total amount of time for the cpu/blt latency and the * fifo A fill is * tr_fifoa_total = lTrFifoAFirst4 + tr_fifoa_remaining; * * The worse case fill time for fifo B is as follows: * lTrFifoB2 = (lRandom + lPageMiss) * lMCLKPeriod; * * The total amount of time elapsed from the crt request until * the first 2 fifob cycles are completed is * lTransferTime = tr_fifoa_total + lTrFifoB2; * * The number of dwords transferred to the fifo during this * time is 2 for 32 bit memory interface or 4 for 64 bit interface. * lDWORDsWritten = 2 * (lBusWidth/4) * * During this period, data continues to be read from the crt * fifo B for screen refresh. The amount of data read, * is approximately: * dwords_read = lTransferTime/lReadPeriod * * The difference between the dwords read and dwords * written must be accounted for in the fifo trheshold setting * * lFifoThresh = (dwords_read - lDWORDsWritten) rounded * up to next even value. * * Since the lTransferTime and dwords_read depends on * the threshold setting, a bit of algebra is required to determine * the minimum setting to prevent fifo underflow. * * lFifoThresh = (lTransferTime/lReadPeriod) - lDWORDsWritten; * = ((tr_fifoa_4 + lTrFifoB2 + tr_fifoa_remaining)/lReadPeriod) * - lDWORDsWritten * to simplify calcuation, break out constant part of equation * K1 = ((tr_fifoa_4 + lTrFifoB2)/lReadPeriod) - lDWORDsWritten; * * lFifoThresh = K1 + (tr_fifoa_remaining/lReadPeriod); * = K1 + (fifoa_remaining * lEffWritePeriod)/lReadPeriod; * lFifoThresh = K1 + * ((FIFO_DEPTH - lFifoThresh + 4 - (lTrFifoAFirst4/lReadPeriod)) * * lEffWritePeriod)/lReadPeriod; * * break out another constant to simplify reduction * K2 = (FIFO_DEPTH + 4 - (lTrFifoAFirst4/lReadPeriod)) * * (lEffWritePeriod/lReadPeriod); * lFifoThresh = K1 + K2 - (lFifoThresh * (lEffWritePeriod/lReadPeriod)); * lFifoThresh * (1 + (lEffWritePeriod/lReadPeriod)) = K1 + K2; * lFifoThresh = (K1 + K2)/(1 + (lEffWritePeriod/lReadPeriod); * * Once the threshold setting is determined, another calculation must * be performed to determine if available bandwidth exists given the * zoom factor. The worst case is assumed to be when FIFO A and * FIFO B reach the threshold point at the same time. The sequence * is then to abort the cpu/blt, fill fifo a, then fill fifo b. * * Since FIFO A is full when the fill B operation starts, I only have * to determine how long it takes to fill FIFO B and then calculate * the the number of dwords read from A during that time. * * lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * lEffWritePeriod))/lReadPeriod; * lFifoALevels = CRT_FIFO_DEPTH - (lTransferTime/lReadPeriod); * * if lFifoALevels < 1, then underflow condition may occur. */ if (lZoom < 512) { // 5446 requires at least a 2X zoom for Y interpolation return (FALSE); } lWritePeriod = ppdev->lMCLKPeriod * 2/(ppdev->lBusWidth/4); lReadPeriod = (lVideoPixelsPerDWORD * lVCLKPeriod * lZoom)/256; lEffWritePeriod = ((lReadPeriod * lWritePeriod)/ (lReadPeriod - lWritePeriod)); lTrFifoAFirst4 = (BLIT_LATENCY + ppdev->lRandom + 3*(ppdev->lPageMiss)) * ppdev->lMCLKPeriod; lTrFifoB2 = (ppdev->lRandom + ppdev->lPageMiss) * ppdev->lMCLKPeriod; lDWORDsWritten = 2 * (ppdev->lBusWidth/4); K1 = ((lTrFifoAFirst4 + lTrFifoB2)/lReadPeriod) - lDWORDsWritten; K2 = (CRT_FIFO_DEPTH + (4*(ppdev->lBusWidth/4)) - (lTrFifoAFirst4/lReadPeriod)) * (lEffWritePeriod/lReadPeriod); ppdev->lFifoThresh = (1 + ((K1 + K2)/(1 + (lEffWritePeriod/lReadPeriod)))); ppdev->lFifoThresh += 3; lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * lEffWritePeriod)); lFifoALevels = ((CRT_FIFO_DEPTH - (lTransferTime/lReadPeriod))/2); if (ppdev->bDoubleClock) { ppdev->lFifoThresh <<= 1; } if ((lFifoALevels < 2) || (ppdev->lFifoThresh > (CRT_FIFO_DEPTH/2))) { return (0); } else { return (1); } } /* * Check bandwidth for color keying */ else if (dwFlags & (OVERLAY_FLG_COLOR_KEY | OVERLAY_FLG_SRC_COLOR_KEY)) { /* * This mode utilizes both FIFOs A and B. During horizontal blank, * both fifos are filled. FIFO a is then filled with graphics data * during regions 1,2 and 3. FIFO B is filled with video data * during region 2, and is idle during regions 1 and 3. * * The normal memory sequence for this mode goes as follows. * * ---------------------------------------------------------------- * | cpu/blit cycle | FIFO A fill | FIFO B fill | cpu/blit cycle . * ---------------------------------------------------------------- * or * ---------------------------------------------------------------- * | cpu/blit cycle | FIFO B fill | FIFO A fill | cpu/blit cycle . * ---------------------------------------------------------------- * * For this mode, the FIFO threshold must be set high enough to allow * enough time to abort the cpu/blt, fill FIFO A, then transfer data * into FIFO B before underflow occurs. If the fifob read rate is * greater than the fifoa read rate, then allow eough time for * a t CPU/blt abort, followed by a fifo B fill, then a FIFO A fill. * * Worst case condition for filling the CRT fifo : * * 1) CPU/blit latency -> * 2) FIFO A random -> * 3) FIFO A page miss -> * 6) FIFO A page mode fill --> * 7) FIFO B random --> * 8) FIFO B page miss * * or * * 1) CPU/blit latency -> * 2) FIFO B random -> * 3) FIFO A page miss -> * 6) FIFO A page mode fill --> * 7) FIFO B random --> * 8) FIFO B page miss * * * 1) lTransferTime = lMCLKPeriod * * (BLIT_LATENCY + lRandom + lPageMiss + * fifoa_remaining + * lRandom + lPageMiss; * * or * 2) lTransferTime = lMCLKPeriod * * (BLIT_LATENCY + lRandom + lPageMiss + * fifob_remaining + * lRandom + lPageMiss; * * * lFifoAReadPeriod = lVCLKPeriod * lGraphicsPixelsPerDWORD; * lFifoBReadPeriod = (lVCLKPeriod * lVideoPixelsPerDWORD * lZoom)*256; * * if (lFifoAReadPeriod > lFifoBReadPeriod), then * first fifo is fifo B, otherwise first is fifo A. * The followinf euqations are written for a fifoa->fifob, * sequence, but the fifob->fifoa sequence can be obtained simply * by swapping the fifo read periods. * * The time required to fill a FIFO depends upon the read rate * of the FIFO and the number of levels that must be filled, * as determined by the threshold setting. * * The worst case fill time for the first four levels of fifo A is * lTrFifoAFirst4 = (BLIT_LATENCY + lRandom + lPageMiss) * * lMCLKPeriod; * * The number of dwords depleted from fifo A during the * fill of the first four levels is * fifoa_reads_4 = lTrFifoAFirst4/lFifoAReadPeriod; * * The number of empty levels remaining in the fifo after * the fill of the first four levels is * fifoa_remaining = FIFO_DEPTH - lFifoThresh + ((4*ramwidth)/4) * - lTrFifoAFirst4/lFifoAReadPeriod; * * The amount of time required to fill the remaining levels of * fifo A is determined by the write rate and the read rate. * lWritePeriod = lMCLKPeriod * 2; * 2 clks per cas * eff_write_period = ((lFifoAReadPeriod * lWritePeriod)/ * (lFifoAReadPeriod - lWritePeriod)); * * tr_fifoa_remaining = fifoa_remaining * eff_write_period; * * * The total amount of time for the cpu/blt latency and the * fifo A fill is * tr_fifoa_total = lTrFifoAFirst4 + tr_fifoa_remaining; * * The worse case fill time for fifo B is as follows: * lTrFifoB2 = (lRandom + lPageMiss) * lMCLKPeriod; * * The total amount of time elapsed from the crt request until * the first 2 fifob cycles are completed is * lTransferTime = tr_fifoa_total + lTrFifoB2; * * The number of dwords transferred to the fifo during this time * is 2 for 32 bit memory interface or 4 for 64 bit interface. * lDWORDsWritten = 2 * (lBusWidth/4) * * During this period, data continues to be read from the crt * fifo B for screen refresh. The amount of data read, * is approximately: * lFifoBReadPeriod = (lVCLKPeriod * lVideoPixelsPerDWORD * lZoom)/256; * dwords_read = lTransferTime/lFifoBReadPeriod * * The difference between the dwords read and dwords * written must be accounted for in the fifo trheshold setting * * lFifoThresh = (dwords_read - lDWORDsWritten) rounded * up to next even value. * * Since the lTransferTime and dwords_read depends on the * threshold setting, a bit of algebra is required to determine * the minimum setting to prevent fifo underflow. * * lFifoThresh = (lTransferTime/lFifoBReadPeriod) - lDWORDsWritten; * = ((tr_fifoa_4 + lTrFifoB2 + tr_fifoa_remaining)/lFifoBReadPeriod) * - lDWORDsWritten * to simplify calcuation, break out constant part of equation * K1 = ((tr_fifoa_4 + lTrFifoB2)/lFifoBReadPeriod) - lDWORDsWritten; * * lFifoThresh = K1 + (tr_fifoa_remaining/lFifoBReadPeriod); * = K1 + (fifoa_remaining * eff_write_period)/lFifoBReadPeriod; * lFifoThresh = K1 + * ((FIFO_DEPTH - lFifoThresh + 4 - (lTrFifoAFirst4/lFifoAReadPeriod)) * * eff_write_period)/read_period; * * break out another constant to simplify reduction * K2 = (FIFO_DEPTH + 4 - (lTrFifoAFirst4/lFifoAReadPeriod)) * * (eff_write_period/lFifoBReadPeriod); * lFifoThresh = K1 + K2 - (lFifoThresh * (eff_write_period/lFifoBReadPeriod)); * lFifoThresh * (1 + (eff_write_period/read_period)) = K1 + K2; * lFifoThresh = (K1 + K2)/(1 + (eff_write_period/lFifoBReadPeriod); * * Once the threshold setting is determined, another calculation must * be performed to determine if available bandwidth exists given the * zoom factor. The worst case is assumed to be when FIFO A and * FIFO B reach the threshold point at the same time. The sequence * is then to abort the cpu/blt, fill fifo a, then fill fifo b. * * Since FIFO A is full when the fill B operation starts, I only have * to determine how long it takes to fill FIFO B and then calculate * the the number of dwords read from A during that time. * * lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * fifob_eff_write_period))/read_period; * fifoa_levels = CRT_FIFO_DEPTH - (lTransferTime/read_period); * * if fifoa_levels < 1, then underflow condition may occur. */ lWritePeriod = ppdev->lMCLKPeriod * 2/(ppdev->lBusWidth/4); lFifoAReadPeriod = lGraphicsPixelsPerDWORD * lVCLKPeriod; lFifoBReadPeriod = (lVideoPixelsPerDWORD * lVCLKPeriod * lZoom)/256; if (lFifoAReadPeriod <= lWritePeriod) // this fails, so set a big# { lFifoAEffWritePeriod = 5000; } else { lFifoAEffWritePeriod = ((lFifoAReadPeriod * lWritePeriod)/ (lFifoAReadPeriod - lWritePeriod)); } if (lFifoBReadPeriod <= lWritePeriod) // this fails, so set a big# { lFifoBEffWritePeriod = 5000; } else { lFifoBEffWritePeriod = ((lFifoBReadPeriod * lWritePeriod)/ (lFifoBReadPeriod - lWritePeriod)); } if ((lFifoAReadPeriod == 0) || (lFifoBReadPeriod == 0) || (lWritePeriod == 0)) { return (FALSE); } // These values should be the same for bot the fifoa->fifob // and fifob->fifoa sequences lTrFifoAFirst4 = (BLIT_LATENCY + ppdev->lRandom + 2*(ppdev->lPageMiss)) * ppdev->lMCLKPeriod; lTrFifoB2 = (ppdev->lRandom + ppdev->lPageMiss) * ppdev->lMCLKPeriod; lDWORDsWritten = 2 * (ppdev->lBusWidth/4); // Since I'm not sure which sequence is worse // Try both then pick worse case results // For fifoa->fifob sequence K1 = ((lTrFifoAFirst4 + lTrFifoB2)/lFifoBReadPeriod) - lDWORDsWritten; K2 = (CRT_FIFO_DEPTH + (4*(ppdev->lBusWidth/4)) - (lTrFifoAFirst4/lFifoAReadPeriod)) * (lFifoAEffWritePeriod/lFifoBReadPeriod); lFifoAThresh = (1 + ((K1 + K2)/ (1 + (lFifoAEffWritePeriod/lFifoBReadPeriod)))); lFifoAThresh += 3; lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * lFifoBEffWritePeriod)); lFifoALevels = ((CRT_FIFO_DEPTH - (lTransferTime/lFifoAReadPeriod))/2); // For fifob->fifoa sequence K1 = ((lTrFifoAFirst4 + lTrFifoB2)/lFifoAReadPeriod) - lDWORDsWritten; K2 = (CRT_FIFO_DEPTH + (4*(ppdev->lBusWidth/4)) - (lTrFifoAFirst4/lFifoBReadPeriod)) * (lFifoBEffWritePeriod/lFifoAReadPeriod); lFifoBThresh = (1 + ((K1 + K2)/ (1 + (lFifoBEffWritePeriod/lFifoAReadPeriod)))); lFifoBThresh += 3; lTransferTime = (lTrFifoB2 + (CRT_FIFO_DEPTH * lFifoAEffWritePeriod)); lFifoBLevels = ((CRT_FIFO_DEPTH - (lTransferTime/lFifoBReadPeriod))/2); if (lFifoAThresh > lFifoBThresh) { ppdev->lFifoThresh = lFifoAThresh; } else { ppdev->lFifoThresh = lFifoBThresh; } if (ppdev->bDoubleClock) { ppdev->lFifoThresh <<= 1; } if ((lFifoBLevels <0) || (lFifoALevels < 0) || (ppdev->lFifoThresh > (CRT_FIFO_DEPTH/2))) { return (0); } else { return (1); } } return (1); // Should never get here!! } // chu03 /********************************************************** * * Name: Is5480SufficientBandwidth * * Module Abstract: * ---------------- * This function reads the current MCLK, VLCK, bus width, etc. * and determines whether the chip has sufficient bandwidth * to handle the requested mode. * * Output Parameters: * ------------------ * none * ***********************************************************/ // ------------------------------------------------------------- // Overview by John Schafer // ------------------------------------------------------------- // The memory arbitration scheme for the 5480 has changed // significantly from the 5446. The 5480 is set up on a first // come, first serve basis. If more than 1 request arrive at // the same clock edge, then the BankSelect is used to determine // which request to acknowledge first. Using SDRAM, the row // access to a differennt bank can be hidden, which saves up to // 7 MCLKs. If all bank selects for the concurrent requests are // the same, the default prority is FIFOA->FIFOB->FIFOC->VCAP. // // The FIFO sizes for the 5480 are as follows: // FIFOA, FIFOB, FIFOC : 32x64 // VCAP : 16x64 (two 8x64 fifos) // // The Y interpolation mode for the 5480 is "free" due to // the embedded line store. The available mode combinations // for the 5480 which effect bandwidth are : // // 1) Capture enabled, 1 video window, no occlusion, not 420 format // 2) Capture enabled, 1 video window, no occlusion, 420 format // 3) Capture enabled, 1 video window, occlusion, not 420 format // 4) Capture enabled, 1 video window, occlusion, 420 format // 5) Capture enabled, 2 video windows (occlusion implied) // 6) Capture disabled, 1 video window, no occlusion, not 420 format // 7) Capture disabled, 1 video window, no occlusion, 420 format // 8) Capture disabled, 1 video window, occlusion, not 420 format // 9) Capture disabled, 1 video window, occlusion, 420 format // 10) Capture disabled, 2 video windows (occlusion implied) // // // ------------------------------------------------------------- // FIFO threshold description // ------------------------------------------------------------- // The memory requests are generated based on the threshold settings // of each FIFO. CRT FIFO thresholds during non-video window lines // are determined by SR16(3:0). CRT FIFO thresholds during video // window lines are determined by CR5C(3:0). // The VCAP fifo threshold is a fixed setting of 8 QWORDS (half). // // The 4 bit threshold for FIFOs A,B, and C indicate the FIFO // level in double QWORDS at which the FIFO request is asserted. // For example, a setting of 4 indicates that the request is // generated when the FIFO level is reduced to 8 QWORDS. // A setting of 0 is a special case which indicates that the // FIFO must be full to prevent a request (i.e. 32 QWORDS). // // The objective of the bandwidth equations is to calculate // the optimum threshold setting and determine which display // modes may be supported for given MCLK and VCLK frequencies. // // The critical parameters which determine the bandwidth limits // are the read and effective write rates for each FIFO. // // ------------------------------------------------------------- // FIFO read/write rates for CRT FIFOs // ------------------------------------------------------------- // The read rate for FIFO A (graphics FIFO) is determined by // the graphics pixel depth and the VCLK frequency. // fa_read_rate = gr_bytes_per_pixel * vclk_period // // The read rates for FIFO B and C are determined differently // depending on display mode. For 420 format the read periods // in nanosecs per byte are as follows: // fb_read_period = ((vclk_period*4) * hzoom) / hdecimate; // fc_read_period = ((vclk_period*4) * hzoom) / hdecimate; // // In this equation hdecimate is specified as 1/decimation_scale, // i.e a 1/2 decimate implies hdecimate = 2 // // For non 420 format the rates are: // fb_read_period = ((vclk_period/vw_bytes_per_pixel) * hzoom) / // hdecimate; // fc_read_period = (vclk_period/vw_bytes_per_pixel); // // Since the FIFOs can be read and written simultaneously, // the effective write rate is determined by the actual fifo // write rate and tje fifo read rate. The actual write rate is based // on single mclk display memory reads. The memory read period is // calculated in terms of nanoseconds per byte. // // bytes_per_memory_transfer is equal to 4 for 32 bit i/f, 8 for 64 bit i/f // mem_read_period = mclk_period/bytes_per_mem_transfer // fa_eff_write_period = (mem_read_period * fa_read_period)/ // (fa_read_period - mem_read_period); // fb_eff_write_period = (mem_read_period * fb_read_period)/ // (fb_read_period - mem_read_period); // fc_eff_write_period = (mem_read_period * fc_read_period)/ // (fc_read_period - mem_read_period); // ------------------------------------------------------------- // FIFO read/write rates for VCAP fifo // ------------------------------------------------------------- // The video capture write rate is based on the data rate // from the video capture interface. Since the video capture // interface can perform format conversion (e.g. 422->PackJR) and // decimation, the capture data rate may be smaller than the actual // video port data rate. The capture period in the following equation // is defined in terms of nanoseconds per byte. The decimation factor // may vary from 1 to 1/256. // // vcap_write_period = (vport_pixel_period/capture_bytes_per_pixel) * // (vport_decimation); // In this equation vport_decimation is specified as 1/decimation_scale, // i.e a 1/2 decimate implies vport_decimation = 2 // // // Since the VCAP fifo can be read and written simultaneously, // the effective read rate is determined by the fifo write rate as well // as the actual fifo read rate. The actual fifo read rate is based on two // memory clock cycle display memory writes. The calculations are in terms // of nanoseconds per byte. // bytes_per_memory_transfer = 4 for 32 bit i/f, or 8 for 64 bit i/f // mem_write_period = 2 * mclk_period/bytes_per_mem_transfer // // vcap_eff_read_period = (mem_write_period * vcap_write_period)/ // (vcap_write_period - mem_write_period); // // ------------------------------------------------------------------- // How to determine if FIFO ABC underflow or VCAP fifo overflow occurs // ------------------------------------------------------------------- // // I will examine a few worst case scenarios to determine if adequate // bandwidth exists to support a given mode. // // Case #1 - start of graphics line where all 3 CRT fifos must be filled // // This condition occurs after hsync when the 3 CRT FIFOs are being // prefilled before the start of the active line. The only risk here is // that the video capture fifo may overflow during the consecutive fills // of fifos A,B, and C. The threshold setting does not matter since the // CRT fifos are cleared on reset and thus guaranteed to be empty. // // For a 32 bit memory interface : // fabc_fill_time = (BLIT_LATENCY * mclk_period) + // 3 * ((RAS_PRECHARGE + 64) * mclk_period) // // For a 64 bit memory interface : // fabc_fill_time = (BLIT_LATENCY * mclk_period) + // 3 * ((RAS_PRECHARGE + 32) * mclk_period) // // A capture fifo overflow occurs if fabc_fill_time is greater than // VCAP fill time based on the worst case 30 MB/s capture rate. // // For a worst case memory interface scenario, let's assume a 32 bit // interface with a 66 MHz memory clock, a blit latency of 10 mclks, // and a ras precharge of 7 mclks. The fabc_fill_time is // then // fabc_fill_time = (10 * 15.2) + // 3 * ((64 + 7) * 15.2) = 3390 ns // // Assuming the worst case 30 MB/s capture rate, the number of // bytes written to the capture fifo during the fabc_fill_time is // 3390 ns * (1 byte/33 ns) = 103 bytes // // Since the capture fifo is 128 bytes deep, the worst case scenario // is OK so long as the capture fifo is emptied prior to the fabc_fill. // // // // Case #2 - Consecutive requests // // It seems that the worst case for servicing of requests is when the requests occur // on consecutive mclks with the order of requests being from the slowest to the // fastest data consumer. In other words, the first to be serviced is the capture fifo, // then the 3 CRT fifos in the order of decreasing read_period. // // First calculate actual and effective read and write periods as decribed above. // Then determine how many requests are active, this is a maximum of 4 if capture // is enabled and all 3 CRT fifos are enabled. Assume that the capture rate // is the slowest and thus is always serviced first. Then order the active // CRT requests as f1 through f3, where f1 has the longest read period and // f3 has the shortest. // // The sequence of events then becomes: // empty vcap -> fill 1 -> fill 2 -> fill 3 // // // Depending on the number of active crt fifos, the fill 2 and fill 3 operations may // be ommitted. The vcap empty is obviously ommitted if capture is not enabled. // // Now step through the sequence and verify that crt fifo underflows and capture // underflows do not occur. // // If capture is enabled, calculate the latency and empty times // vcap_latency = (BLIT_LATENCY + RAS_PRECHARGE) * mclk_period; // vcap_bytes_to_empty = CAP_FIFO_DEPTH; // vcap_empty_time = (vcap_read_period * vcap_bytes_to_empty); // Since one of the capture fifos continues to fill while the other is being // emptied, calculate the number of filled levels in the capture fifo at // the end of the memory transfer. // vcap_levels_remaining = (vcap_latency + vcap_empty_time)/vcap_write_period; // If the number of levels filled exceeds the fifo depth, then an overflow occurred. // // Note that the VCAP FIFO operates differently than the CRT fifos. The VCAP // FIFO operates as 2 8x64 FIFOs. A memory request is asserted when one of the // FIFOs is full. The capture interface then fills the other fifo while the // full fifo is being serviced by the sequencer. Using this method, the transfer // to memory is always 16 QWORDs for VCAP data (except special end of line conditions). // // Now check fifo 1. If capture was enabled then the latency for fifo 1 is: // f1_latency = vcap_latency + vcap_empty_time + // (BLIT_LATENCY + RAS_PRECHARGE) * mclk_period; // // otherwise the latency is: // f1_latency = (BLIT_LATENCY + RAS_PRECHARGE) * mclk_period; // // Calculate the number of empty levels in fifo 1, i.e. the number of bytes // that must be filled. // f1_bytes_to_fill = ((16-threshold) * 16) + (f1_latency/f1_read_period); // If the number of levels to be filled exceeds the fifo depth, then an underflow occurred. // Calculate the fill time based on the effective fifo write rate. // f1_fill_time = (f1_eff_write_period * f1_bytes_to_fill); // // If fifo_2 is active, calculate its latency and bytes to be filled. // f2_latency = f1_latency + f1_fill_time + // (RAS_PRECHARGE * mclk_period); // f2_bytes_to_fill = ((16-threshold) * 16) + (f2_latency/f2_read_period); // If the number of levels to be filled exceeds the fifo depth, then an underflow occurred. // Calculate the fill time based on the effective fifo write rate. // f2_fill_time = (f2_eff_write_period * f2_bytes_to_fill); // // If fifo_2 is active, calculate its latency and bytes to be filled. // f3_latency = f2_latency + f2_fill_time + // (RAS_PRECHARGE * mclk_period); // f3_bytes_to_fill = ((16-threshold) * 16) + (f3_latency/f3_read_period); // If the number of levels to be filled exceeds the fifo depth, then an underflow occurred. // Calculate the fill time based on the effective fifo write rate. // f3_fill_time = (f3_eff_write_period * f3_bytes_to_fill); // // Now go back to the start of sequence and make sure that none of the FIFOs // have already initiated another request. The totla latency is the amount // of time required to execute the entire sequence. // // Check vcap fif status if capture is enabled, // vcap_latency = total_latency; // vcap_bytes_to_empty = (total_latency/vcap_write_period); // // Check fifo 1 status // f1_latency = (total_latency - f1_latency - f1_fill_time); // f1_bytes_to_fill = (f1_latency/f1_read_period); // // Check fifo 2 status if active // f2_latency = (total_latency - f1_latency - f1_fill_time); // f3_bytes_to_fill = (f1_latency/f1_read_period); // //*************************************************************************** static BOOL Is5480SufficientBandwidth (PDEV* ppdev, WORD wVideoDepth, LPRECTL lpSrc, LPRECTL lpDest, DWORD dwFlags) { long lVideoPixelsPerDWORD; long lGraphicsPixelsPerDWORD; long lCapturePixelsPerDWORD; long lVideoBytesPerPixel; long lGraphicsBytesPerPixel; long lCaptureBytesPerPixel; long lVCLKPeriod; long lZoom; long lFifoAReadPeriod; long lFifoBReadPeriod; long lFifoCReadPeriod; long lFifoAEffWritePeriod; long lFifoBEffWritePeriod; long lFifoCEffWritePeriod; long lMemReadPeriod; long lVPortPixelPeriod; long lVCapReadPeriod; long lVCapWritePeriod; long lFifo1ReadPeriod; long lFifo2ReadPeriod; long lFifo3ReadPeriod; long lFifo1EffWritePeriod; long lFifo2EffWritePeriod; long lFifo3EffWritePeriod; long lVCapLatency; long lVCapBytesToEmpty; long lVCapEmptyTime; long lVCapLevelRemaining; long lFifo1Latency; long lFifo1BytesToFill; long lFifo1FillTime; long lFifo2Latency; long lFifo2BytesToFill; long lFifo2FillTime; long lFifo3Latency; long lFifo3BytesToFill; long lFifo3FillTime; long lThreshold; int CrtFifoCount; BOOL bCapture; BOOL bFifoAEnable; BOOL bFifoBEnable; BOOL bFifoCEnable; BOOL bModePass; long lHorizDecimate; long lVPortDecimate; long lTotalLatency; long lVCLK; UCHAR tempB ; BYTE* pjPorts = ppdev->pjPorts ; #define CAP_FIFO_DEPTH 64 #define RAS_PRECHARGE 7 #define BLIT_LATENCY 9 // // Parameter checking // lFifo2EffWritePeriod = 0; lFifo3EffWritePeriod = 0; lHorizDecimate = 1; lVPortDecimate = 1; // // Convert input parameters // if (wVideoDepth == 16) { lVideoPixelsPerDWORD = 2; lCapturePixelsPerDWORD = 2; } else if (wVideoDepth == 8) { lVideoPixelsPerDWORD = 4; lCapturePixelsPerDWORD = 4; } else return (FALSE); if (ppdev->cBitsPerPixel == 8) { lGraphicsPixelsPerDWORD = 4; } else if (ppdev->cBitsPerPixel == 16) { lGraphicsPixelsPerDWORD = 2; } else if (ppdev->cBitsPerPixel == 24) { lGraphicsPixelsPerDWORD = 1; } else return (FALSE); lGraphicsBytesPerPixel = 4 / lGraphicsPixelsPerDWORD; lVideoBytesPerPixel = 4 / lVideoPixelsPerDWORD; lCaptureBytesPerPixel = 4 / lCapturePixelsPerDWORD; lZoom = (lpDest->right - lpDest->left) / (lpSrc->right - lpSrc->left); if (lZoom < 1) lZoom = 1; // // We need to get the VCLK every time since this can change at run-time // lVCLK = GetVCLK(ppdev); lVCLKPeriod = (long) ((1024000000l/lVCLK) + 1); // // Video port at 13.5 MHz // lVPortPixelPeriod = (long) ((10240000) / 135); // // Graphics CRT FIFO read rate // lFifoAReadPeriod = lGraphicsBytesPerPixel * lVCLKPeriod; // // Video FIFO read rate // if(dwFlags & OVERLAY_FLG_YUVPLANAR) { lFifoBReadPeriod = ((lVCLKPeriod * 4) * lZoom) / lHorizDecimate; lFifoCReadPeriod = ((lVCLKPeriod * 4) * lZoom) / lHorizDecimate; } else { lFifoBReadPeriod = ((lVCLKPeriod / lVideoBytesPerPixel) * lZoom) / lHorizDecimate; lFifoCReadPeriod = lVCLKPeriod / lVideoBytesPerPixel; } DISPDBG ((2, "lFifoAReadPeriod = %ld, lFifoBReadPeriod=%ld\n", lFifoAReadPeriod, lFifoBReadPeriod)); DISPDBG ((2, "lFifoCReadPeriod = %ld\n", lFifoCReadPeriod)); // // Video capture write period // lVCapWritePeriod = (lVPortPixelPeriod / lCaptureBytesPerPixel) * lVPortDecimate; if (!ppdev->lBusWidth) { // // We will read the bus width from SR0F[4:3] // CP_OUT_BYTE (pjPorts, SR_INDEX, 0x0F) ; if ((CP_IN_BYTE(pjPorts, SR_DATA) & 0x18) == 0x18) ppdev->lBusWidth = 8; // 64 bit bus else ppdev->lBusWidth = 4; // 32 bit bus } if (!ppdev->lMCLKPeriod) { LONG lMCLK; // // The MCLK period is the amount of time required for one cycle. // We will round up. // CP_OUT_BYTE (pjPorts, SR_INDEX, 0x1F) ; // First get the MCLK frequency lMCLK = CP_IN_BYTE(pjPorts, SR_DATA); lMCLK *= 14318; lMCLK >>= 3; ppdev->lMCLKPeriod = (long) ((1024000000l/lMCLK) + 1); } // // Calculate CRT effective read and write periods // lMemReadPeriod = ppdev->lMCLKPeriod / ppdev->lBusWidth; if (lFifoAReadPeriod == lMemReadPeriod) lFifoAEffWritePeriod = 1000000000; else lFifoAEffWritePeriod = (lMemReadPeriod * lFifoAReadPeriod) / (lFifoAReadPeriod - lMemReadPeriod); if (lFifoBReadPeriod == lMemReadPeriod) lFifoBEffWritePeriod = 1000000000; else lFifoBEffWritePeriod = (lMemReadPeriod * lFifoBReadPeriod) / (lFifoBReadPeriod - lMemReadPeriod); if (lFifoCReadPeriod == lMemReadPeriod) lFifoCEffWritePeriod = 1000000000; else lFifoCEffWritePeriod = (lMemReadPeriod * lFifoCReadPeriod) / (lFifoCReadPeriod - lMemReadPeriod); // // Video capture read period // lVCapReadPeriod = (2 * ppdev->lMCLKPeriod) / ppdev->lBusWidth; if (dwFlags & OVERLAY_FLG_CAPTURE) // is capture enable ? bCapture = TRUE; else bCapture = FALSE; if (dwFlags & OVERLAY_FLG_YUVPLANAR) // is 420 format { if (dwFlags & (OVERLAY_FLG_COLOR_KEY | OVERLAY_FLG_SRC_COLOR_KEY)) // occlusion { // one video window, occlusion, 420 format bFifoAEnable = TRUE; bFifoBEnable = TRUE; bFifoCEnable = TRUE; } else { // one video window, no occlusion, 420 format bFifoAEnable = FALSE; bFifoBEnable = TRUE; bFifoCEnable = TRUE; } } else // not 420 format { if (dwFlags & (OVERLAY_FLG_COLOR_KEY | OVERLAY_FLG_SRC_COLOR_KEY)) // occlusion { if (dwFlags & OVERLAY_FLG_TWO_VIDEO) { // Two video windows, occlusion, not 420 format bFifoAEnable = TRUE; bFifoBEnable = TRUE; bFifoCEnable = TRUE; } else { // one video window, occlusion, not 420 format bFifoAEnable = TRUE; bFifoBEnable = TRUE; bFifoCEnable = FALSE; } } else { // one video window, no occlusion, not 420 format bFifoAEnable = FALSE; bFifoBEnable = TRUE; bFifoCEnable = FALSE; } } DISPDBG ((4, " FIFOA = %s, FIFOB= %s, FIFOC = %s\n", bFifoAEnable ? "yes" : "no", bFifoBEnable ? "yes" : "no", bFifoCEnable ? "yes" : "no")); lFifo1ReadPeriod = 0; lFifo2ReadPeriod = 0; lFifo3ReadPeriod = 0; if (bFifoAEnable) { if (((lFifoAReadPeriod >= lFifoBReadPeriod) || !bFifoBEnable) && // A slower than or equal than B) and ((lFifoAReadPeriod >= lFifoCReadPeriod) || !bFifoCEnable)) // A slower than or equal C { lFifo1ReadPeriod = lFifoAReadPeriod; lFifo1EffWritePeriod = lFifoAEffWritePeriod; } else if (((lFifoAReadPeriod >= lFifoBReadPeriod) || !bFifoBEnable) || // A slower than or equal B ((lFifoAReadPeriod >= lFifoCReadPeriod) || !bFifoCEnable)) // A slower than or equal C { lFifo2ReadPeriod = lFifoAReadPeriod; lFifo2EffWritePeriod = lFifoAEffWritePeriod; } else // A not slower than A or B { lFifo3ReadPeriod = lFifoAReadPeriod; lFifo3EffWritePeriod = lFifoAEffWritePeriod; } } DISPDBG ((2, "After bFifoAEnable")) ; DISPDBG ((2, "lFifo1ReadPeriod = %ld, lFifo2ReadPeriod=%ld", lFifo1ReadPeriod, lFifo2ReadPeriod)) ; DISPDBG ((2, "lFifo3ReadPeriod = %ld", lFifo3ReadPeriod)) ; if (bFifoBEnable) { if (((lFifoBReadPeriod > lFifoAReadPeriod) || !bFifoAEnable) && // B slower than A and ((lFifoBReadPeriod >= lFifoCReadPeriod) || !bFifoCEnable)) // slower than or equal A { lFifo1ReadPeriod = lFifoBReadPeriod; lFifo1EffWritePeriod = lFifoBEffWritePeriod; } else if (((lFifoBReadPeriod > lFifoAReadPeriod) || !bFifoAEnable) || // B slower than A or ((lFifoBReadPeriod >= lFifoCReadPeriod) || !bFifoCEnable)) // B slower than or equal C { lFifo2ReadPeriod = lFifoBReadPeriod; lFifo2EffWritePeriod = lFifoBEffWritePeriod; } else // (B not slower than A ) and (B not slower than or equal C) { lFifo3ReadPeriod = lFifoBReadPeriod; lFifo3EffWritePeriod = lFifoBEffWritePeriod; } } else DISPDBG ((4, "After bFifoBEnable")) ; DISPDBG ((4, "lFifo1ReadPeriod = %ld, lFifo2ReadPeriod=%ld", lFifo1ReadPeriod, lFifo2ReadPeriod)) ; DISPDBG ((4, "lFifo3ReadPeriod = %ld", lFifo3ReadPeriod)) ; if (bFifoCEnable) { if (((lFifoCReadPeriod > lFifoAReadPeriod) || !bFifoAEnable) && // C slower than A and ((lFifoCReadPeriod > lFifoBReadPeriod) || !bFifoBEnable)) // C slower than B { lFifo1ReadPeriod = lFifoCReadPeriod; lFifo1EffWritePeriod = lFifoCEffWritePeriod; } else if (((lFifoCReadPeriod > lFifoAReadPeriod) || !bFifoAEnable) || // C slower than A or ((lFifoCReadPeriod > lFifoBReadPeriod) || !bFifoBEnable)) // C slower than B { lFifo2ReadPeriod = lFifoCReadPeriod; lFifo2EffWritePeriod = lFifoCEffWritePeriod; } else { // C not slower than A and C not slower than B lFifo3ReadPeriod = lFifoCReadPeriod; lFifo3EffWritePeriod = lFifoCEffWritePeriod; } } DISPDBG ((4, "After bFifoCEnable")) ; DISPDBG ((4, "lFifo1ReadPeriod = %ld, lFifo2ReadPeriod=%ld", lFifo1ReadPeriod, lFifo2ReadPeriod)) ; DISPDBG ((4, "lFifo3ReadPeriod = %ld", lFifo3ReadPeriod)) ; DISPDBG ((4, "lFifo1EffWritePeriod = %ld, lFifo2EffWritePeriod = %ld", lFifo1EffWritePeriod, lFifo2EffWritePeriod)) ; DISPDBG ((4, " lFifo3EffWritePeriod = %ld", lFifo3EffWritePeriod)) ; DISPDBG ((4, " lFifoAEffWritePeriod = %ld, lFifoBEffWritePeriod = %ld", lFifoAEffWritePeriod, lFifoBEffWritePeriod)) ; DISPDBG ((4, " lFifoCEffWritePeriod = %ld", lFifoCEffWritePeriod)) ; bModePass = FALSE; lThreshold = 1; CrtFifoCount = 0; if (bFifoAEnable) CrtFifoCount++; if (bFifoBEnable) CrtFifoCount++; if (bFifoCEnable) CrtFifoCount++; while ((!bModePass) && (lThreshold < 16)) { bModePass = TRUE; // assume pass until proven otherwise. // // Checking capture // if (bCapture) { lVCapLatency = (BLIT_LATENCY + RAS_PRECHARGE) * ppdev->lMCLKPeriod; lVCapBytesToEmpty = CAP_FIFO_DEPTH; lVCapEmptyTime = lVCapReadPeriod * lVCapBytesToEmpty; lVCapLevelRemaining = (lVCapLatency + lVCapEmptyTime) / lVCapWritePeriod; if (lVCapLevelRemaining > CAP_FIFO_DEPTH) return(FALSE); } // // Fill FIFO 1 // if (bCapture) lFifo1Latency = lVCapLatency + lVCapEmptyTime + (BLIT_LATENCY + RAS_PRECHARGE) * ppdev->lMCLKPeriod; else lFifo1Latency = (BLIT_LATENCY + RAS_PRECHARGE) * ppdev->lMCLKPeriod; lFifo1BytesToFill = ((16 - lThreshold) * 16) + (lFifo1Latency / lFifo1ReadPeriod); lFifo1FillTime = lFifo1EffWritePeriod * lFifo1BytesToFill; if (lFifo1BytesToFill > 256) bModePass = FALSE; DISPDBG ((4, "After Fill FIFO1, lFifo1BytesToFillb=%ld, ModePass = %s", lFifo1BytesToFill, bModePass ? "yes" : "no")) ; DISPDBG ((4, "f1_latency=%ld, f1_read_period=%ld", lFifo1Latency, lFifo1ReadPeriod)) ; DISPDBG ((4, "mclkperiod= %ld, vclkperiod=%ld", ppdev->lMCLKPeriod, lVCLKPeriod)) ; // // Fill FIFO 2 // if (CrtFifoCount > 1) { lFifo2Latency = lFifo1Latency + lFifo1FillTime + (RAS_PRECHARGE * ppdev->lMCLKPeriod); lFifo2BytesToFill = ((16 - lThreshold) * 16) + (lFifo2Latency / lFifo2ReadPeriod); lFifo2FillTime = lFifo2EffWritePeriod * lFifo2BytesToFill; if (lFifo2BytesToFill > 256) bModePass = FALSE; } else { lFifo2Latency = lFifo1Latency + lFifo1FillTime; lFifo2BytesToFill = 0; lFifo2FillTime = 0; } DISPDBG ((4, "After Fill FIFO2, lFifo2BytesToFill=%ld, ModePass = %s", lFifo2BytesToFill, bModePass ? "yes" : "no")); // // Fill FIFO 3 // if (CrtFifoCount > 2) { lFifo3Latency = lFifo2Latency + lFifo2FillTime + (RAS_PRECHARGE * ppdev->lMCLKPeriod); lFifo3BytesToFill = ((16 - lThreshold) * 16) + (lFifo3Latency / lFifo3ReadPeriod); lFifo3FillTime = lFifo3EffWritePeriod * lFifo3BytesToFill; if (lFifo3BytesToFill > 256) bModePass = FALSE; } else { lFifo3Latency = lFifo2Latency + lFifo2FillTime; lFifo3BytesToFill = 0; lFifo3FillTime = 0; } DISPDBG ((4, "After Fill FIFO3, lFifo3BytesToFill=%ld, ModePass = %s", lFifo3BytesToFill, bModePass ? "yes" : "no")) ; // // Determine total latency through the sequence // lTotalLatency = lFifo3Latency + lFifo3FillTime; // // Now back to start of sequence, make sure that none of the FIFOs // have already initiated another request. // // // Check capture FIFO status // if (bCapture) { lVCapLatency = lTotalLatency; lVCapBytesToEmpty = lTotalLatency / lVCapWritePeriod; if (lVCapBytesToEmpty > CAP_FIFO_DEPTH) bModePass = FALSE; } // // Check FIFO 1 status // lFifo1Latency = lTotalLatency - lFifo1Latency - lFifo1FillTime; lFifo1BytesToFill = lFifo1Latency / lFifo1ReadPeriod; if (lFifo1BytesToFill > ((16 - lThreshold) * 16)) bModePass = FALSE; DISPDBG ((4, "After CheckF FIFO1, fifo1bytestofill %ld,bModePass = %s", lFifo1BytesToFill, bModePass ? "yes" : "no")) ; // // Check FIFO 2 status // if (CrtFifoCount > 1) { lFifo2Latency = lTotalLatency - lFifo2Latency - lFifo2FillTime; lFifo2BytesToFill = lFifo2Latency / lFifo2ReadPeriod; if (lFifo2BytesToFill > ((16 - lThreshold) * 16)) bModePass = FALSE; DISPDBG ((4, "After Check FIFO 2, fifo1bytestofill=%ld, bModePass = %s", lFifo2BytesToFill, bModePass ? "yes" : "no")) ; } if (!bModePass) lThreshold++; } if (bModePass) { DISPDBG ((1, "Is sufficient Bandwidth, thresh = %ld, return TRUE\n", lThreshold)); if (ppdev->cBitsPerPixel == 24) lThreshold = 0x0F; ppdev->lFifoThresh = lThreshold; return TRUE ; } DISPDBG ((2, "Is sufficient Bandwidth, thresh = %ld, rerurn FALSE", lThreshold)); return FALSE; } /********************************************************** * * Name: GetVCLK * * Module Abstract: * ---------------- * Returns the VCLK frequency * 1000. * * Input Parameters: * ----------------- * none * * Output Parameters: * ------------------ * MCLK * *********************************************************** * Author: Shuhua Ge * Date: 09/25/96 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ LONG GetVCLK(PDEV* ppdev) { LONG lTemp; LONG lRegSR1F; LONG lRegMISC; LONG lNR; LONG lDR; LONG lPS; BYTE* pjPorts = ppdev->pjPorts; /* * First read SR1F. This tells us if VCLK is derived from MCLK * or if it's derived normally. */ CP_OUT_BYTE(pjPorts, SR_INDEX, 0x1f); lRegSR1F = (LONG) CP_IN_BYTE(pjPorts, SR_DATA); if (lRegSR1F & 0x40) { LONG lMCLK; /* * It is derived from MCLK, but now we need to read SR1E to see * if VCLK = MCLK or if VCLK = MCLK/2. */ lMCLK = (lRegSR1F & 0x3F) * 14318; CP_OUT_BYTE(pjPorts, SR_INDEX, 0x1e); if (CP_IN_BYTE(pjPorts, SR_DATA) & 0x01) { return (lMCLK >> 4); } else { return (lMCLK >> 3); } } else { /* * Read MISC[3:2], which tells us where to find our VCLK */ lRegMISC = (LONG) CP_IN_BYTE(pjPorts, 0x3cc); lRegMISC >>= 2; //myf33 begin CP_OUT_BYTE(pjPorts, CRTC_INDEX, (BYTE)0x80); if (((ppdev->ulChipID == CL7555_ID) || (ppdev->ulChipID == CL7556_ID)) && (CP_IN_BYTE(pjPorts, CRTC_DATA) & 0x01)) lRegMISC &= 0x02; // Fixed PDR 8709 else //myf33 end lRegMISC &= 0x03; lNR = 0x0B + lRegMISC; lDR = 0x1B + lRegMISC; /* * Read the values for bP, bDR, and bNR */ CP_OUT_BYTE(pjPorts, SR_INDEX, (BYTE) lDR); lPS = lDR = (LONG)CP_IN_BYTE(pjPorts, SR_DATA); CP_OUT_BYTE(pjPorts, SR_INDEX, (BYTE) lNR); lNR = (LONG)CP_IN_BYTE(pjPorts, SR_DATA); lPS &= 0x01; lPS += 1; lDR >>= 1; // // Extended the VCLK bits. // // sge06 lDR &= 0x7f; lNR &= 0x7f; /* * VCLK = (14.31818 * bNR) / (bDR * bPS) */ lTemp = (14318 * lNR); if (!lPS || !lDR) { return (0); } lTemp /= (lDR * lPS); } return (lTemp); } /********************************************************** * * Name: EnableStartAddrDoubleBuffer * * Module Abstract: * ---------------- * Enable the double buffering of the start addresses. This allows the page * flipping operation to proceed without the system CPU waiting for VRT. * * Input Parameters: * ----------------- * none * * Output Parameters: * ------------------ * *********************************************************** * Author: Shuhua Ge * Date: 10/01/96 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ VOID EnableStartAddrDoubleBuffer(PDEV* ppdev) { BYTE* pjPorts = ppdev->pjPorts; BYTE cTemp; CP_OUT_BYTE(pjPorts, CRTC_INDEX, 0x1a); cTemp = CP_IN_BYTE(pjPorts, CRTC_DATA); CP_OUT_BYTE(pjPorts, CRTC_DATA, cTemp | 2); } /********************************************************** * * Name: GetCurrentVLine * * Module Abstract: * ---------------- * Get the current scan line * * Input Parameters: * ----------------- * none * * Output Parameters: * ------------------ * *********************************************************** * Author: Shuhua Ge * Date: 10/01/96 * * Revision History: * ----------------- * WHO WHEN WHAT/WHY/HOW * --- ---- ------------ * *********************************************************/ DWORD GetCurrentVLine(PDEV* ppdev) { DWORD dwLine; BYTE cTemp; BYTE* pjPorts = ppdev->pjPorts; CP_OUT_BYTE(pjPorts, INDEX_REG, 0x16); /* Index to the low byte. */ dwLine = (ULONG)CP_IN_BYTE(pjPorts, DATA_REG); CP_OUT_BYTE(pjPorts, INDEX_REG, 0x17); /* Index to the high bits. */ cTemp = CP_IN_BYTE(pjPorts, DATA_REG); dwLine |= (cTemp & 3) << 8; CP_OUT_BYTE(pjPorts, INDEX_REG, 0x16); /* Index to the low byte. */ /* If we wrapped around while getting the high bits we have a problem. */ /* The high bits may be wrong. */ if((CP_IN_BYTE(pjPorts, DATA_REG)) < (dwLine & 0xff)) { DISPDBG((1, "Recursive call to GetCurrentVLine.")); return GetCurrentVLine(ppdev); } if (dwLine > ppdev->dwVsyncLine) { return 0; } return dwLine; } #endif #endif // DIRECTDRAW