//===== Copyright © 1996-2005, Valve Corporation, All rights reserved. ======// // // Purpose: // // $NoKeywords: $ //===========================================================================// #include "tier2/beamsegdraw.h" #include "materialsystem/imaterialvar.h" #include "convar.h" // memdbgon must be the last include file in a .cpp file!!! #include "tier0/memdbgon.h" //----------------------------------------------------------------------------- // // CBeamSegDraw implementation. // //----------------------------------------------------------------------------- void CBeamSegDraw::Start( IMatRenderContext *pRenderContext, int nSegs, IMaterial *pMaterial, CMeshBuilder *pMeshBuilder, int nMeshVertCount ) { m_pRenderContext = pRenderContext; Assert( nSegs >= 2 ); m_nSegsDrawn = 0; m_nTotalSegs = nSegs; m_pRenderContext->GetWorldSpaceCameraPosition( &m_vecCameraPos ); if ( pMeshBuilder ) { m_pMeshBuilder = pMeshBuilder; m_nMeshVertCount = nMeshVertCount; } else { m_pMeshBuilder = NULL; m_nMeshVertCount = 0; IMesh *pMesh = m_pRenderContext->GetDynamicMesh( true, NULL, NULL, pMaterial ); m_Mesh.Begin( pMesh, MATERIAL_TRIANGLE_STRIP, (nSegs-1) * 2 ); } } inline void CBeamSegDraw::ComputeNormal( const Vector &vecCameraPos, const Vector &vStartPos, const Vector &vNextPos, Vector *pNormal ) { // vTangentY = line vector for beam Vector vTangentY; VectorSubtract( vStartPos, vNextPos, vTangentY ); // vDirToBeam = vector from viewer origin to beam Vector vDirToBeam; VectorSubtract( vStartPos, vecCameraPos, vDirToBeam ); // Get a vector that is perpendicular to us and perpendicular to the beam. // This is used to fatten the beam. CrossProduct( vTangentY, vDirToBeam, *pNormal ); VectorNormalizeFast( *pNormal ); } inline void CBeamSegDraw::SpecifySeg( const Vector &vecCameraPos, const Vector &vNormal ) { // SUCKY: Need to do a fair amount more work to get the tangent owing to the averaged normal Vector vDirToBeam, vTangentY; VectorSubtract( m_Seg.m_vPos, vecCameraPos, vDirToBeam ); CrossProduct( vDirToBeam, vNormal, vTangentY ); VectorNormalizeFast( vTangentY ); // Build the endpoints. Vector vPoint1, vPoint2; VectorMA( m_Seg.m_vPos, m_Seg.m_flWidth*0.5f, vNormal, vPoint1 ); VectorMA( m_Seg.m_vPos, -m_Seg.m_flWidth*0.5f, vNormal, vPoint2 ); if ( m_pMeshBuilder ) { // Specify the points. m_pMeshBuilder->Position3fv( vPoint1.Base() ); m_pMeshBuilder->Color4ubv( (const unsigned char *) &m_Seg.m_color ); m_pMeshBuilder->TexCoord2f( 0, 0, m_Seg.m_flTexCoord ); m_pMeshBuilder->TexCoord2f( 1, 0, m_Seg.m_flTexCoord ); m_pMeshBuilder->TangentS3fv( vNormal.Base() ); m_pMeshBuilder->TangentT3fv( vTangentY.Base() ); m_pMeshBuilder->AdvanceVertex(); m_pMeshBuilder->Position3fv( vPoint2.Base() ); m_pMeshBuilder->Color4ubv( (const unsigned char *) &m_Seg.m_color ); m_pMeshBuilder->TexCoord2f( 0, 1, m_Seg.m_flTexCoord ); m_pMeshBuilder->TexCoord2f( 1, 1, m_Seg.m_flTexCoord ); m_pMeshBuilder->TangentS3fv( vNormal.Base() ); m_pMeshBuilder->TangentT3fv( vTangentY.Base() ); m_pMeshBuilder->AdvanceVertex(); if ( m_nSegsDrawn > 1 ) { int nBase = ( ( m_nSegsDrawn - 2 ) * 2 ) + m_nMeshVertCount; m_pMeshBuilder->FastIndex( nBase ); m_pMeshBuilder->FastIndex( nBase + 1 ); m_pMeshBuilder->FastIndex( nBase + 2 ); m_pMeshBuilder->FastIndex( nBase + 1 ); m_pMeshBuilder->FastIndex( nBase + 3 ); m_pMeshBuilder->FastIndex( nBase + 2 ); } } else { // Specify the points. m_Mesh.Position3fv( vPoint1.Base() ); m_Mesh.Color4ubv( (const unsigned char *) &m_Seg.m_color ); m_Mesh.TexCoord2f( 0, 0, m_Seg.m_flTexCoord ); m_Mesh.TexCoord2f( 1, 0, m_Seg.m_flTexCoord ); m_Mesh.TangentS3fv( vNormal.Base() ); m_Mesh.TangentT3fv( vTangentY.Base() ); m_Mesh.AdvanceVertex(); m_Mesh.Position3fv( vPoint2.Base() ); m_Mesh.Color4ubv( (const unsigned char *) &m_Seg.m_color ); m_Mesh.TexCoord2f( 0, 1, m_Seg.m_flTexCoord ); m_Mesh.TexCoord2f( 1, 1, m_Seg.m_flTexCoord ); m_Mesh.TangentS3fv( vNormal.Base() ); m_Mesh.TangentT3fv( vTangentY.Base() ); m_Mesh.AdvanceVertex(); } } void CBeamSegDraw::NextSeg( BeamSeg_t *pSeg ) { if ( m_nSegsDrawn > 0 ) { // Get a vector that is perpendicular to us and perpendicular to the beam. // This is used to fatten the beam. Vector vNormal, vAveNormal; ComputeNormal( m_vecCameraPos, m_Seg.m_vPos, pSeg->m_vPos, &vNormal ); if ( m_nSegsDrawn > 1 ) { // Average this with the previous normal VectorAdd( vNormal, m_vNormalLast, vAveNormal ); vAveNormal *= 0.5f; VectorNormalizeFast( vAveNormal ); } else { vAveNormal = vNormal; } m_vNormalLast = vNormal; SpecifySeg( m_vecCameraPos, vAveNormal ); } m_Seg = *pSeg; ++m_nSegsDrawn; if( m_nSegsDrawn == m_nTotalSegs ) { SpecifySeg( m_vecCameraPos, m_vNormalLast ); } } void CBeamSegDraw::LoadSIMDData( FourVectors * RESTRICT pV4StartPos, FourVectors * RESTRICT pV4EndPos, FourVectors * RESTRICT pV4HalfWidth, int nV4SegCount, const BeamSeg_t * pSegs ) { const BeamSeg_t *RESTRICT pCurSeg = pSegs; for ( int i = 0; i < nV4SegCount; ++i, pCurSeg+= 4 ) { pV4StartPos[i].LoadAndSwizzleAligned( pCurSeg[0].m_vPos, pCurSeg[1].m_vPos, pCurSeg[2].m_vPos, pCurSeg[3].m_vPos ); pV4EndPos[i].LoadAndSwizzleAligned( pCurSeg[1].m_vPos, pCurSeg[2].m_vPos, pCurSeg[3].m_vPos, pCurSeg[4].m_vPos ); // load and broadcast the halfwidths // if you load from values in memory (rather than computed values in registers), // .Load is faster. pV4HalfWidth[i].Load( pCurSeg[0].m_flWidth , pCurSeg[1].m_flWidth , pCurSeg[2].m_flWidth , pCurSeg[3].m_flWidth ); pV4HalfWidth[i] *= Four_PointFives; } } void CBeamSegDraw::ComputeRenderInfo( BeamSegRenderInfo_t * pRenderInfo, const Vector &vecCameraPos, int nSegCount, const BeamSeg_t *pSrcSegs ) RESTRICT { int nPaddedSegCount = ( ( nSegCount + 3 ) >> 2 ) << 2; // FIXME: Can we figure out a way of avoiding this extra copy? // NOTE: We need an extra one since LoadSIMDData will load off the end BeamSeg_t *pSegs = (BeamSeg_t*)stackalloc( ( nPaddedSegCount + 1 ) * sizeof(BeamSeg_t) ); memcpy( pSegs, pSrcSegs, nSegCount * sizeof(BeamSeg_t) ); int nEndSegCount = ( nPaddedSegCount - nSegCount + 1 ); BeamSeg_t endCap = pSrcSegs[nSegCount-1]; endCap.m_vPos += pSrcSegs[nSegCount-1].m_vPos - pSrcSegs[nSegCount-2].m_vPos; for ( int i = 0; i < nEndSegCount; ++i ) { memcpy( &pSegs[nSegCount+i], &endCap, sizeof(BeamSeg_t) ); } FourVectors v4CameraPos; v4CameraPos.LoadAndSwizzle( vecCameraPos ); int nV4SegCount = nPaddedSegCount >> 2; FourVectors *pV4StartPos = (FourVectors*)stackalloc( nV4SegCount * sizeof(FourVectors) ); FourVectors *pV4EndPos = (FourVectors*)stackalloc( nV4SegCount * sizeof(FourVectors) ); FourVectors *pV4HalfWidth = (FourVectors*)stackalloc( nV4SegCount * sizeof(FourVectors) ); FourVectors *pV4AveNormals = (FourVectors*)stackalloc( ( nV4SegCount + 2 ) * sizeof(FourVectors) ); CBeamSegDraw::LoadSIMDData( pV4StartPos, pV4EndPos, pV4HalfWidth, nV4SegCount, pSegs ); fltx4 v4LMask = { 0.25f, 0.25f, 0.25f, 0.0f }; fltx4 v4LPrevMask = { 0.0f, 0.0f, 0.0f, 0.25f }; fltx4 v4RMask = { 0.0f, 0.25f, 0.25f, 0.25f }; fltx4 v4RNextMask = { 0.25f, 0.0f, 0.0f, 0.0f }; fltx4 v4AveFactor = { 0.5f, 0.5f, 0.5f, 0.5f }; // This is the only ones that need initial data are the first two memset( pV4AveNormals, 0, 2 * sizeof(FourVectors) ); // Yes, that 1 is correct. We're going to write bogus crap on either end FourVectors eps( FLT_EPSILON ); FourVectors *pV4CurAveNormal = &pV4AveNormals[1]; for ( int i = 0; i < nV4SegCount; ++i, ++pV4CurAveNormal ) { // prefetch PREFETCH360( pRenderInfo + (i << 2), 0 ); PREFETCH360( pRenderInfo + (i << 2) + 1, 0 ); FourVectors v4TangentY = pV4StartPos[i] - pV4EndPos[i]; FourVectors v4CameraToStart = pV4StartPos[i] - v4CameraPos; FourVectors v4Normal = v4TangentY ^ v4CameraToStart; v4Normal += eps; v4Normal = VectorNormalizeFast( v4Normal ); FourVectors v4LNormal = RotateLeft( v4Normal ); FourVectors v4RNormal = RotateRight( v4Normal ); pV4CurAveNormal[0] = Madd( v4Normal, v4AveFactor, pV4CurAveNormal[0] ); pV4CurAveNormal[0] = Madd( v4LNormal, v4LMask, pV4CurAveNormal[0] ); pV4CurAveNormal[0] = Madd( v4RNormal, v4RMask, pV4CurAveNormal[0] ); pV4CurAveNormal[-1] = Madd( v4LNormal, v4LPrevMask, pV4CurAveNormal[-1] ); pV4CurAveNormal[1] = Mul( v4RNormal, v4RNextMask ); } // FIXME: Do I need to fixup the endpoints, to clamp their normals to the unsmoothed value? // Maybe I can get away with not doing that. FourVectors *pV4Normals = &pV4AveNormals[1]; FourVectors *pV4TangentY = (FourVectors*)stackalloc( nV4SegCount * sizeof(FourVectors) ); FourVectors *pV4Point1 = (FourVectors*)stackalloc( nV4SegCount * sizeof(FourVectors) ); FourVectors *pV4Point2 = (FourVectors*)stackalloc( nV4SegCount * sizeof(FourVectors) ); for ( int i = 0; i < nV4SegCount; ++i ) { // prefetch // (write top half rows) PREFETCH360( pRenderInfo + (i << 2) + 2, 0 ); PREFETCH360( pRenderInfo + (i << 2) + 3, 0 ); FourVectors v4Normal = VectorNormalizeFast( pV4Normals[i] ); FourVectors v4CameraToStart = pV4StartPos[i] - v4CameraPos; FourVectors v4TangentY = v4CameraToStart ^ v4Normal; pV4Normals[i] = v4Normal; v4TangentY += eps; pV4TangentY[i] = VectorNormalizeFast( v4TangentY ); FourVectors v4Offset = Mul( v4Normal, pV4HalfWidth[i] ); pV4Point1[i] = pV4StartPos[i] + v4Offset; pV4Point2[i] = pV4StartPos[i] - v4Offset; } const BeamSeg_t * RESTRICT pSeg = pSrcSegs; // The code below has a few load-hit-stores (due to the // transform to vector for store). For an alternate // pathway that does the same thing without the LHS, // see changelist 588032. It was more complicated, but // didn't profile to actually be any faster, so it // was taken back out. for ( int i = 0 ; i < nSegCount; ++i, ++pRenderInfo, ++pSeg ) { int nIndex = ( i >> 2 ); int j = ( i & 0x3 ); pRenderInfo->m_vecCenter = pV4StartPos[nIndex].Vec( j ); pRenderInfo->m_vecPoint1 = pV4Point1[nIndex].Vec( j ); pRenderInfo->m_vecPoint2 = pV4Point2[nIndex].Vec( j ); pRenderInfo->m_vecTangentS = pV4Normals[nIndex].Vec( j ); pRenderInfo->m_vecTangentT = pV4TangentY[nIndex].Vec( j ); pRenderInfo->m_flTexCoord = pSeg->m_flTexCoord; pRenderInfo->m_color = pSeg->m_color; } } void CBeamSegDraw::End() { if ( m_pMeshBuilder ) { m_pMeshBuilder = NULL; return; } m_Mesh.End( false, true ); } //----------------------------------------------------------------------------- // Purpose: //----------------------------------------------------------------------------- void CBeamSegDrawArbitrary::SetNormal( const Vector &normal ) { m_vNormalLast = normal; } //----------------------------------------------------------------------------- // Purpose: //----------------------------------------------------------------------------- void CBeamSegDrawArbitrary::NextSeg( BeamSeg_t *pSeg ) { if ( m_nSegsDrawn > 0 ) { Vector segDir = ( m_PrevSeg.m_vPos - pSeg->m_vPos ); VectorNormalize( segDir ); Vector normal = CrossProduct( segDir, m_vNormalLast ); SpecifySeg( normal ); } m_PrevSeg = m_Seg; m_Seg = *pSeg; ++m_nSegsDrawn; } void CBeamSegDrawArbitrary::SpecifySeg( const Vector &vNormal ) { // Build the endpoints. Vector vPoint1, vPoint2; Vector vDelta; VectorMultiply( vNormal, m_Seg.m_flWidth*0.5f, vDelta ); VectorAdd( m_Seg.m_vPos, vDelta, vPoint1 ); VectorSubtract( m_Seg.m_vPos, vDelta, vPoint2 ); m_Mesh.Position3fv( vPoint1.Base() ); m_Mesh.Color4ub( m_Seg.m_color.r, m_Seg.m_color.g, m_Seg.m_color.b, m_Seg.m_color.a ); m_Mesh.TexCoord2f( 0, 0, m_Seg.m_flTexCoord ); m_Mesh.TexCoord2f( 1, 0, m_Seg.m_flTexCoord ); m_Mesh.AdvanceVertex(); m_Mesh.Position3fv( vPoint2.Base() ); m_Mesh.Color4ub( m_Seg.m_color.r, m_Seg.m_color.g, m_Seg.m_color.b, m_Seg.m_color.a ); m_Mesh.TexCoord2f( 0, 1, m_Seg.m_flTexCoord ); m_Mesh.TexCoord2f( 1, 1, m_Seg.m_flTexCoord ); m_Mesh.AdvanceVertex(); }