You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
420 lines
14 KiB
420 lines
14 KiB
// $Id:$
|
|
|
|
#ifndef RAYTRACE_H
|
|
#define RAYTRACE_H
|
|
|
|
#include <tier0/platform.h>
|
|
#include <mathlib/vector.h>
|
|
#include <mathlib/ssemath.h>
|
|
#include <mathlib/lightdesc.h>
|
|
#include <assert.h>
|
|
#include <tier1/utlvector.h>
|
|
#include <tier1/utlbuffer.h>
|
|
#include <mathlib/mathlib.h>
|
|
#include <bspfile.h>
|
|
|
|
// fast SSE-ONLY ray tracing module. Based upon various "real time ray tracing" research.
|
|
//#define DEBUG_RAYTRACE 1
|
|
|
|
class FourRays
|
|
{
|
|
public:
|
|
FourVectors origin;
|
|
FourVectors direction;
|
|
|
|
inline void Check(void) const
|
|
{
|
|
// in order to be valid to trace as a group, all four rays must have the same signs in all
|
|
// of their direction components
|
|
#ifndef NDEBUG
|
|
for(int c=1;c<4;c++)
|
|
{
|
|
Assert(direction.X(0)*direction.X(c)>=0);
|
|
Assert(direction.Y(0)*direction.Y(c)>=0);
|
|
Assert(direction.Z(0)*direction.Z(c)>=0);
|
|
}
|
|
#endif
|
|
}
|
|
// returns direction sign mask for 4 rays. returns -1 if the rays can not be traced as a
|
|
// bundle.
|
|
int CalculateDirectionSignMask(void) const;
|
|
|
|
};
|
|
|
|
/// The format a triangle is stored in for intersections. size of this structure is important.
|
|
/// This structure can be in one of two forms. Before the ray tracing environment is set up, the
|
|
/// ProjectedEdgeEquations hold the coordinates of the 3 vertices, for facilitating bounding box
|
|
/// checks needed while building the tree. afterwards, they are changed into the projected ege
|
|
/// equations for intersection purposes.
|
|
enum triangleflags
|
|
{
|
|
FCACHETRI_TRANSPARENT = 0x01,
|
|
FCACHETRI_NEGATIVE_NORMAL = 0x02,
|
|
};
|
|
|
|
|
|
struct TriIntersectData_t
|
|
{
|
|
// this structure is 16longs=64 bytes for cache line packing.
|
|
float m_flNx, m_flNy, m_flNz; // plane equation
|
|
float m_flD;
|
|
|
|
int32 m_nTriangleID; // id of the triangle.
|
|
|
|
float m_ProjectedEdgeEquations[6]; // A,B,C for each edge equation. a
|
|
// point is inside the triangle if
|
|
// a*c1+b*c2+c is negative for all 3
|
|
// edges.
|
|
|
|
uint8 m_nCoordSelect0,m_nCoordSelect1; // the triangle is projected onto a 2d
|
|
// plane for edge testing. These are
|
|
// the indices (0..2) of the
|
|
// coordinates preserved in the
|
|
// projection
|
|
|
|
uint8 m_nFlags; // triangle flags
|
|
uint8 m_unused0; // no longer used
|
|
};
|
|
|
|
|
|
struct TriGeometryData_t
|
|
{
|
|
int32 m_nTriangleID; // id of the triangle.
|
|
|
|
float m_VertexCoordData[9]; // can't use a vector in a union
|
|
|
|
uint8 m_nFlags; // triangle flags
|
|
signed char m_nTmpData0; // used by kd-tree builder
|
|
signed char m_nTmpData1; // used by kd-tree builder
|
|
|
|
|
|
// accessors to get around union annoyance
|
|
FORCEINLINE Vector &Vertex(int idx)
|
|
{
|
|
return * ( reinterpret_cast<Vector *> ( m_VertexCoordData+3*idx ) );
|
|
}
|
|
|
|
};
|
|
|
|
|
|
struct CacheOptimizedTriangle
|
|
{
|
|
|
|
union
|
|
{
|
|
TriIntersectData_t m_IntersectData;
|
|
TriGeometryData_t m_GeometryData;
|
|
} m_Data;
|
|
|
|
// accessors to get around union annoyance
|
|
FORCEINLINE Vector &Vertex(int idx)
|
|
{
|
|
return * ( reinterpret_cast<Vector *> (m_Data.m_GeometryData.m_VertexCoordData+3*idx ) );
|
|
}
|
|
|
|
FORCEINLINE const Vector &Vertex(int idx) const
|
|
{
|
|
return * ( reinterpret_cast<const Vector *> (m_Data.m_GeometryData.m_VertexCoordData+3*idx ) );
|
|
}
|
|
|
|
void ChangeIntoIntersectionFormat(void); // change information storage format for
|
|
// computing intersections.
|
|
|
|
int ClassifyAgainstAxisSplit(int split_plane, float split_value); // PLANECHECK_xxx below
|
|
|
|
// Debug - take a triangle that has been converted to intersection format and extract the vertices
|
|
// from by intersecting the planes
|
|
void ExtractVerticesFromIntersectionFormat( Vector &v0, Vector &v1, Vector &v2 ) const;
|
|
};
|
|
|
|
#define PLANECHECK_POSITIVE 1
|
|
#define PLANECHECK_NEGATIVE -1
|
|
#define PLANECHECK_STRADDLING 0
|
|
|
|
#define KDNODE_STATE_XSPLIT 0 // this node is an x split
|
|
#define KDNODE_STATE_YSPLIT 1 // this node is a ysplit
|
|
#define KDNODE_STATE_ZSPLIT 2 // this node is a zsplit
|
|
#define KDNODE_STATE_LEAF 3 // this node is a leaf
|
|
|
|
struct CacheOptimizedKDNode
|
|
{
|
|
// this is the cache intensive data structure. "Tricks" are used to fit it into 8 bytes:
|
|
//
|
|
// A) the right child is always stored after the left child, which means we only need one
|
|
// pointer
|
|
// B) The type of node (KDNODE_xx) is stored in the lower 2 bits of the pointer.
|
|
// C) for leaf nodes, we store the number of triangles in the leaf in the same place as the floating
|
|
// point splitting parameter is stored in a non-leaf node
|
|
|
|
int32 Children; // child idx, or'ed with flags above
|
|
float SplittingPlaneValue; // for non-leaf nodes, the nodes on the
|
|
// "high" side of the splitting plane
|
|
// are on the right
|
|
|
|
#ifdef DEBUG_RAYTRACE
|
|
Vector vecMins;
|
|
Vector vecMaxs;
|
|
#endif
|
|
|
|
inline int NodeType(void) const
|
|
|
|
{
|
|
return Children & 3;
|
|
}
|
|
|
|
inline int32 TriangleIndexStart(void) const
|
|
{
|
|
assert(NodeType()==KDNODE_STATE_LEAF);
|
|
return Children>>2;
|
|
}
|
|
|
|
inline int LeftChild(void) const
|
|
{
|
|
assert(NodeType()!=KDNODE_STATE_LEAF);
|
|
return Children>>2;
|
|
}
|
|
|
|
inline int RightChild(void) const
|
|
{
|
|
return LeftChild()+1;
|
|
}
|
|
|
|
inline int NumberOfTrianglesInLeaf(void) const
|
|
{
|
|
assert(NodeType()==KDNODE_STATE_LEAF);
|
|
return *((int32 *) &SplittingPlaneValue);
|
|
}
|
|
|
|
inline void SetNumberOfTrianglesInLeafNode(int n)
|
|
{
|
|
*((int32 *) &SplittingPlaneValue)=n;
|
|
}
|
|
|
|
protected:
|
|
|
|
|
|
};
|
|
|
|
|
|
struct RayTracingSingleResult
|
|
{
|
|
Vector surface_normal; // surface normal at intersection
|
|
int32 HitID; // -1=no hit. otherwise, triangle index
|
|
float HitDistance; // distance to intersection
|
|
float ray_length; // leng of initial ray
|
|
};
|
|
|
|
struct RayTracingResult
|
|
{
|
|
FourVectors surface_normal; // surface normal at intersection
|
|
ALIGN16 int32 HitIds[4] ALIGN16_POST; // -1=no hit. otherwise, triangle index
|
|
fltx4 HitDistance; // distance to intersection
|
|
};
|
|
|
|
|
|
class RayTraceLight
|
|
{
|
|
public:
|
|
FourVectors Position;
|
|
FourVectors Intensity;
|
|
};
|
|
|
|
|
|
#define RTE_FLAGS_FAST_TREE_GENERATION 1
|
|
#define RTE_FLAGS_DONT_STORE_TRIANGLE_COLORS 2 // saves memory if not needed
|
|
#define RTE_FLAGS_DONT_STORE_TRIANGLE_MATERIALS 4
|
|
|
|
enum RayTraceLightingMode_t {
|
|
DIRECT_LIGHTING, // just dot product lighting
|
|
DIRECT_LIGHTING_WITH_SHADOWS, // with shadows
|
|
GLOBAL_LIGHTING // global light w/ shadows
|
|
};
|
|
|
|
|
|
class RayStream
|
|
{
|
|
friend class RayTracingEnvironment;
|
|
|
|
RayTracingSingleResult *PendingStreamOutputs[8][4];
|
|
int n_in_stream[8];
|
|
FourRays PendingRays[8];
|
|
|
|
public:
|
|
RayStream(void)
|
|
{
|
|
memset(n_in_stream,0,sizeof(n_in_stream));
|
|
}
|
|
};
|
|
|
|
// When transparent triangles are in the list, the caller can provide a callback that will get called at each triangle
|
|
// allowing the callback to stop processing if desired.
|
|
// UNDONE: This is not currently SIMD - it really only supports single rays
|
|
// Also for efficiency FourRays really needs some kind of active mask for the cases where rays get unbundled
|
|
class ITransparentTriangleCallback
|
|
{
|
|
public:
|
|
virtual bool VisitTriangle_ShouldContinue( const TriIntersectData_t &triangle, const FourRays &rays, bi32x4 *hitMask, fltx4 *b0, fltx4 *b1, fltx4 *b2, int32 hitID ) = 0;
|
|
};
|
|
|
|
enum RTECullMode_t
|
|
{
|
|
RTE_CULL_NONE = 0,
|
|
RTE_CULL_FRONT,
|
|
RTE_CULL_BACK
|
|
};
|
|
|
|
// serialization flag bits and defines
|
|
#define RT_ENV_SERIALIZE_COLORS 1
|
|
|
|
class RayTracingEnvironment
|
|
{
|
|
public:
|
|
uint32 Flags; // RTE_FLAGS_xxx above
|
|
Vector m_MinBound;
|
|
Vector m_MaxBound;
|
|
|
|
FourVectors BackgroundColor; //< color where no intersection
|
|
CUtlVector<CacheOptimizedKDNode> OptimizedKDTree; //< the packed kdtree. root is 0
|
|
CUtlBlockVector<CacheOptimizedTriangle> OptimizedTriangleList; //< the packed triangles
|
|
CUtlVector<int32> TriangleIndexList; //< the list of triangle indices.
|
|
CUtlVector<LightDesc_t> LightList; //< the list of lights
|
|
CUtlVector<Vector> TriangleColors; //< color of tries
|
|
CUtlVector<int32> TriangleMaterials; //< material index of tries
|
|
|
|
public:
|
|
RayTracingEnvironment() : OptimizedTriangleList( 1024 )
|
|
{
|
|
BackgroundColor.DuplicateVector(Vector(1,0,0)); // red
|
|
Flags=0;
|
|
}
|
|
|
|
#if !( defined ( _DEBUG ) && defined ( HAMMER_RAYTRACE ) )
|
|
inline void* operator new( size_t size ) { MEM_ALLOC_CREDIT_( "RayTracingEnvironment" ); return MemAlloc_AllocAligned( size, 16 ); }
|
|
inline void* operator new( size_t size, int nBlockUse, const char *pFileName, int nLine ) { MEM_ALLOC_CREDIT_( "RayTracingEnvironment" ); return MemAlloc_AllocAligned( size, 16 ); }
|
|
inline void operator delete( void* p ) { MemAlloc_FreeAligned( p ); }
|
|
inline void operator delete( void* p, int nBlockUse, const char *pFileName, int nLine ) { MemAlloc_FreeAligned( p ); }
|
|
#endif
|
|
|
|
// call AddTriangle to set up the world
|
|
void AddTriangle(int32 id, const Vector &v1, const Vector &v2, const Vector &v3,
|
|
const Vector &color);
|
|
|
|
// Adds a triangle with flags & material
|
|
void AddTriangle(int32 id, const Vector &v1, const Vector &v2, const Vector &v3,
|
|
const Vector &color, uint16 flags, int32 materialIndex);
|
|
|
|
|
|
void AddQuad(int32 id, const Vector &v1, const Vector &v2, const Vector &v3,
|
|
const Vector &v4, // specify vertices in cw or ccw order
|
|
const Vector &color);
|
|
|
|
// for ease of testing.
|
|
void AddAxisAlignedRectangularSolid(int id,Vector mincoord, Vector Maxcoord,
|
|
const Vector &color);
|
|
|
|
|
|
// SetupAccelerationStructure to prepare for tracing
|
|
void SetupAccelerationStructure(void);
|
|
|
|
// lowest level intersection routine - fire 4 rays through the scene. all 4 rays must pass the
|
|
// Check() function, and t extents must be initialized. skipid can be set to exclude a
|
|
// particular id (such as the origin surface). This function finds the closest intersection.
|
|
template <RTECullMode_t cullMode>
|
|
void Trace4Rays(const FourRays &rays, fltx4 TMin, fltx4 TMax,int DirectionSignMask,
|
|
RayTracingResult *rslt_out,
|
|
int32 skip_id=-1, ITransparentTriangleCallback *pCallback = NULL );
|
|
|
|
// wrapper for the low level trace4 rays routine
|
|
void Trace4Rays(const FourRays &rays, fltx4 TMin, fltx4 TMax,int DirectionSignMask,
|
|
RayTracingResult *rslt_out,
|
|
int32 skip_id=-1, ITransparentTriangleCallback *pCallback = NULL, RTECullMode_t cullMode = RTE_CULL_NONE );
|
|
|
|
// higher level intersection routine that handles computing the mask and handling rays which do not match in direciton sign
|
|
void Trace4Rays(const FourRays &rays, fltx4 TMin, fltx4 TMax,
|
|
RayTracingResult *rslt_out,
|
|
int32 skip_id=-1, ITransparentTriangleCallback *pCallback = NULL, RTECullMode_t cullMode = RTE_CULL_NONE );
|
|
|
|
// compute virtual light sources to model inter-reflection
|
|
void ComputeVirtualLightSources(void);
|
|
|
|
|
|
// high level interface - pass viewing parameters, rendering flags, and a destination frame
|
|
// buffer, and get a ray traced scene in 32-bit rgba format
|
|
void RenderScene(int width, int height, // width and height of desired rendering
|
|
int stride, // actual width in pixels of target buffer
|
|
uint32 *output_buffer, // pointer to destination
|
|
Vector CameraOrigin, // eye position
|
|
Vector ULCorner, // word space coordinates of upper left
|
|
// monitor corner
|
|
Vector URCorner, // top right corner
|
|
Vector LLCorner, // lower left
|
|
Vector LRCorner, // lower right
|
|
RayTraceLightingMode_t lightmode=DIRECT_LIGHTING);
|
|
|
|
|
|
/// raytracing stream - lets you trace an array of rays by feeding them to this function.
|
|
/// results will not be returned until FinishStream is called. This function handles sorting
|
|
/// the rays by direction, tracing them 4 at a time, and de-interleaving the results.
|
|
|
|
void AddToRayStream(RayStream &s,
|
|
Vector const &start,Vector const &end,RayTracingSingleResult *rslt_out,
|
|
RTECullMode_t cullMode = RTE_CULL_NONE);
|
|
|
|
inline void FlushStreamEntry(RayStream &s, int msk, RTECullMode_t cullMode = RTE_CULL_NONE);
|
|
|
|
/// call this when you are done. handles all cleanup. After this is called, all rslt ptrs
|
|
/// previously passed to AddToRaySteam will have been filled in.
|
|
void FinishRayStream(RayStream &s, RTECullMode_t cullMode = RTE_CULL_NONE);
|
|
|
|
|
|
int MakeLeafNode(int first_tri, int last_tri);
|
|
|
|
|
|
float CalculateCostsOfSplit(
|
|
int split_plane,int32 const *tri_list,int ntris,
|
|
Vector MinBound,Vector MaxBound, float &split_value,
|
|
int &nleft, int &nright, int &nboth);
|
|
|
|
void RefineNode(int node_number,int32 const *tri_list,int ntris,
|
|
Vector MinBound,Vector MaxBound, int depth);
|
|
|
|
void CalculateTriangleListBounds(int32 const *tris,int ntris,
|
|
Vector &minout, Vector &maxout);
|
|
|
|
void AddInfinitePointLight(Vector position, // light center
|
|
Vector intensity); // rgb amount
|
|
|
|
// use the global variables set by LoadBSPFile to populated the RayTracingEnvironment with
|
|
// faces.
|
|
void InitializeFromLoadedBSP(void);
|
|
|
|
void AddBSPFace(int id,dface_t const &face);
|
|
|
|
// MakeRoomForTriangles - a hint telling it how many triangles we are going to add so that
|
|
// the utl vectors used can be pre-allocated
|
|
void MakeRoomForTriangles( int ntriangles );
|
|
|
|
const CacheOptimizedTriangle &GetTriangle( int32 triID )
|
|
{
|
|
return OptimizedTriangleList[triID];
|
|
}
|
|
|
|
int32 GetTriangleMaterial( int32 triID )
|
|
{
|
|
return TriangleMaterials[triID];
|
|
}
|
|
const Vector &GetTriangleColor( int triID )
|
|
{
|
|
return TriangleColors[triID];
|
|
}
|
|
|
|
// (un)serialization
|
|
size_t GetSerializationNumBytes( uint32 nSerializationFlags = 0 ) const;
|
|
void Serialize( CUtlBuffer &outbuf, uint32 nSerializationFlags = 0 ) const;
|
|
void UnSerialize( CUtlBuffer &inbuf );
|
|
|
|
};
|
|
|
|
|
|
|
|
#endif
|