Leaked source code of Windows Server 2003
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

322 lines
11 KiB

  1. #include "pch.cpp"
  2. #pragma hdrstop
  3. //---------------------------------------------------------------------
  4. // This function uses Cramer's Rule to calculate the matrix inverse.
  5. // See nt\private\windows\opengl\serever\soft\so_math.c
  6. //
  7. // Returns:
  8. // 0 - if success
  9. // -1 - if input matrix is singular
  10. //
  11. int Inverse4x4(D3DMATRIX *src, D3DMATRIX *inverse)
  12. {
  13. double x00, x01, x02;
  14. double x10, x11, x12;
  15. double x20, x21, x22;
  16. double rcp;
  17. double x30, x31, x32;
  18. double y01, y02, y03, y12, y13, y23;
  19. double z02, z03, z12, z13, z22, z23, z32, z33;
  20. #define x03 x01
  21. #define x13 x11
  22. #define x23 x21
  23. #define x33 x31
  24. #define z00 x02
  25. #define z10 x12
  26. #define z20 x22
  27. #define z30 x32
  28. #define z01 x03
  29. #define z11 x13
  30. #define z21 x23
  31. #define z31 x33
  32. /* read 1st two columns of matrix into registers */
  33. x00 = src->_11;
  34. x01 = src->_12;
  35. x10 = src->_21;
  36. x11 = src->_22;
  37. x20 = src->_31;
  38. x21 = src->_32;
  39. x30 = src->_41;
  40. x31 = src->_42;
  41. /* compute all six 2x2 determinants of 1st two columns */
  42. y01 = x00*x11 - x10*x01;
  43. y02 = x00*x21 - x20*x01;
  44. y03 = x00*x31 - x30*x01;
  45. y12 = x10*x21 - x20*x11;
  46. y13 = x10*x31 - x30*x11;
  47. y23 = x20*x31 - x30*x21;
  48. /* read 2nd two columns of matrix into registers */
  49. x02 = src->_13;
  50. x03 = src->_14;
  51. x12 = src->_23;
  52. x13 = src->_24;
  53. x22 = src->_33;
  54. x23 = src->_34;
  55. x32 = src->_43;
  56. x33 = src->_44;
  57. /* compute all 3x3 cofactors for 2nd two columns */
  58. z33 = x02*y12 - x12*y02 + x22*y01;
  59. z23 = x12*y03 - x32*y01 - x02*y13;
  60. z13 = x02*y23 - x22*y03 + x32*y02;
  61. z03 = x22*y13 - x32*y12 - x12*y23;
  62. z32 = x13*y02 - x23*y01 - x03*y12;
  63. z22 = x03*y13 - x13*y03 + x33*y01;
  64. z12 = x23*y03 - x33*y02 - x03*y23;
  65. z02 = x13*y23 - x23*y13 + x33*y12;
  66. /* compute all six 2x2 determinants of 2nd two columns */
  67. y01 = x02*x13 - x12*x03;
  68. y02 = x02*x23 - x22*x03;
  69. y03 = x02*x33 - x32*x03;
  70. y12 = x12*x23 - x22*x13;
  71. y13 = x12*x33 - x32*x13;
  72. y23 = x22*x33 - x32*x23;
  73. /* read 1st two columns of matrix into registers */
  74. x00 = src->_11;
  75. x01 = src->_12;
  76. x10 = src->_21;
  77. x11 = src->_22;
  78. x20 = src->_31;
  79. x21 = src->_32;
  80. x30 = src->_41;
  81. x31 = src->_42;
  82. /* compute all 3x3 cofactors for 1st column */
  83. z30 = x11*y02 - x21*y01 - x01*y12;
  84. z20 = x01*y13 - x11*y03 + x31*y01;
  85. z10 = x21*y03 - x31*y02 - x01*y23;
  86. z00 = x11*y23 - x21*y13 + x31*y12;
  87. /* compute 4x4 determinant & its reciprocal */
  88. rcp = x30*z30 + x20*z20 + x10*z10 + x00*z00;
  89. if (rcp == (float)0)
  90. return -1;
  91. rcp = (float)1/rcp;
  92. /* compute all 3x3 cofactors for 2nd column */
  93. z31 = x00*y12 - x10*y02 + x20*y01;
  94. z21 = x10*y03 - x30*y01 - x00*y13;
  95. z11 = x00*y23 - x20*y03 + x30*y02;
  96. z01 = x20*y13 - x30*y12 - x10*y23;
  97. /* multiply all 3x3 cofactors by reciprocal */
  98. inverse->_11 = (float)(z00*rcp);
  99. inverse->_21 = (float)(z01*rcp);
  100. inverse->_12 = (float)(z10*rcp);
  101. inverse->_31 = (float)(z02*rcp);
  102. inverse->_13 = (float)(z20*rcp);
  103. inverse->_41 = (float)(z03*rcp);
  104. inverse->_14 = (float)(z30*rcp);
  105. inverse->_22 = (float)(z11*rcp);
  106. inverse->_32 = (float)(z12*rcp);
  107. inverse->_23 = (float)(z21*rcp);
  108. inverse->_42 = (float)(z13*rcp);
  109. inverse->_24 = (float)(z31*rcp);
  110. inverse->_33 = (float)(z22*rcp);
  111. inverse->_43 = (float)(z23*rcp);
  112. inverse->_34 = (float)(z32*rcp);
  113. inverse->_44 = (float)(z33*rcp);
  114. return 0;
  115. }
  116. //---------------------------------------------------------------------
  117. #define MATRIX_PRODUCT(res, a, b) \
  118. res->_11 = a->_11*b->_11 + a->_12*b->_21 + a->_13*b->_31 + a->_14*b->_41; \
  119. res->_12 = a->_11*b->_12 + a->_12*b->_22 + a->_13*b->_32 + a->_14*b->_42; \
  120. res->_13 = a->_11*b->_13 + a->_12*b->_23 + a->_13*b->_33 + a->_14*b->_43; \
  121. res->_14 = a->_11*b->_14 + a->_12*b->_24 + a->_13*b->_34 + a->_14*b->_44; \
  122. \
  123. res->_21 = a->_21*b->_11 + a->_22*b->_21 + a->_23*b->_31 + a->_24*b->_41; \
  124. res->_22 = a->_21*b->_12 + a->_22*b->_22 + a->_23*b->_32 + a->_24*b->_42; \
  125. res->_23 = a->_21*b->_13 + a->_22*b->_23 + a->_23*b->_33 + a->_24*b->_43; \
  126. res->_24 = a->_21*b->_14 + a->_22*b->_24 + a->_23*b->_34 + a->_24*b->_44; \
  127. \
  128. res->_31 = a->_31*b->_11 + a->_32*b->_21 + a->_33*b->_31 + a->_34*b->_41; \
  129. res->_32 = a->_31*b->_12 + a->_32*b->_22 + a->_33*b->_32 + a->_34*b->_42; \
  130. res->_33 = a->_31*b->_13 + a->_32*b->_23 + a->_33*b->_33 + a->_34*b->_43; \
  131. res->_34 = a->_31*b->_14 + a->_32*b->_24 + a->_33*b->_34 + a->_34*b->_44; \
  132. \
  133. res->_41 = a->_41*b->_11 + a->_42*b->_21 + a->_43*b->_31 + a->_44*b->_41; \
  134. res->_42 = a->_41*b->_12 + a->_42*b->_22 + a->_43*b->_32 + a->_44*b->_42; \
  135. res->_43 = a->_41*b->_13 + a->_42*b->_23 + a->_43*b->_33 + a->_44*b->_43; \
  136. res->_44 = a->_41*b->_14 + a->_42*b->_24 + a->_43*b->_34 + a->_44*b->_44;
  137. //---------------------------------------------------------------------
  138. // result = a*b
  139. // result is the same as a or b
  140. //
  141. void MatrixProduct2(D3DMATRIX *result, D3DMATRIX *a, D3DMATRIX *b)
  142. {
  143. D3DMATRIX res;
  144. MATRIX_PRODUCT((&res), a, b);
  145. *(D3DMATRIX*)result = res;
  146. }
  147. //---------------------------------------------------------------------
  148. // result = a*b.
  149. // "result" pointer could be equal to "a" or "b"
  150. //
  151. void MatrixProduct(D3DMATRIX *result, D3DMATRIX *a, D3DMATRIX *b)
  152. {
  153. if (result == a || result == b)
  154. {
  155. MatrixProduct2(result, a, b);
  156. return;
  157. }
  158. MATRIX_PRODUCT(result, a, b);
  159. }
  160. ///////////////////////////////////////////////////////////////////////////////
  161. //
  162. ///////////////////////////////////////////////////////////////////////////////
  163. //---------------------------------------------------------------------
  164. // RRProcessVertices::UpdateXformData
  165. // Updates transform data used by ProcessVertices
  166. //---------------------------------------------------------------------
  167. HRESULT
  168. RRProcessVertices::UpdateXformData()
  169. {
  170. HRESULT hr = D3D_OK;
  171. RRVIEWPORTDATA& VData = m_ViewData;
  172. RRTRANSFORMDATA& TData = m_TransformData;
  173. // Update viewport information
  174. if (m_dwDirtyFlags & RRPV_DIRTY_ZRANGE)
  175. {
  176. VData.scaleZ = m_Viewport.dvMaxZ - m_Viewport.dvMinZ;
  177. VData.offsetZ = m_Viewport.dvMinZ;
  178. // ATTENTION: This could be a Divide by Zero here if
  179. // the dvMaxZ == dvMinZ. Fix it later.
  180. VData.scaleZi = D3DVAL(1) / VData.scaleZ;
  181. }
  182. if (m_dwDirtyFlags & RRPV_DIRTY_VIEWRECT)
  183. {
  184. // Bail if we are going to cause any divide by zero exceptions.
  185. // The likely reason is that we have a bogus viewport set by
  186. // TLVertex execute buffer app.
  187. if(m_Viewport.dwWidth == 0 || m_Viewport.dwHeight == 0 )
  188. return DDERR_GENERIC;
  189. VData.dvX = D3DVAL(m_Viewport.dwX);
  190. VData.dvY = D3DVAL(m_Viewport.dwY);
  191. VData.dvWidth = D3DVAL(m_Viewport.dwWidth);
  192. VData.dvHeight = D3DVAL(m_Viewport.dwHeight);
  193. // Coefficients to compute screen coordinates from normalized window
  194. // coordinates
  195. VData.scaleX = VData.dvWidth;
  196. VData.scaleY = - VData.dvHeight;
  197. VData.offsetX = VData.dvX;
  198. VData.offsetY = VData.dvY + VData.dvHeight;
  199. #if 0
  200. // Small offset is added to prevent generation of negative screen
  201. // coordinates (this could happen because of precision errors).
  202. // Not needed (or wanted) for devices which do guardband.
  203. VData.offsetX += SMALL_NUMBER;
  204. VData.offsetY += SMALL_NUMBER;
  205. #endif
  206. VData.scaleXi = D3DVAL(1) / VData.scaleX;
  207. VData.scaleYi = D3DVAL(1) / VData.scaleY;
  208. VData.minX = VData.dvX;
  209. VData.maxX = VData.dvX + VData.dvWidth;
  210. VData.minY = VData.dvY;
  211. VData.maxY = VData.dvY + VData.dvHeight;
  212. if (m_dwTLState & RRPV_GUARDBAND)
  213. {
  214. // Because we clip by guard band window we have to use its extents
  215. D3DVALUE w = 2.0f / VData.dvWidth;
  216. D3DVALUE h = 2.0f / VData.dvHeight;
  217. D3DVALUE ax1 = -(VData.minXgb - VData.dvX) * w + 1.0f;
  218. D3DVALUE ax2 = (VData.maxXgb - VData.dvX) * w - 1.0f;
  219. D3DVALUE ay1 = (VData.maxYgb - VData.dvY) * h - 1.0f;
  220. D3DVALUE ay2 = -(VData.minYgb - VData.dvY) * h + 1.0f;
  221. VData.gb11 = 2.0f / (ax1 + ax2);
  222. VData.gb41 = VData.gb11 * (ax1 - 1.0f) * 0.5f;
  223. VData.gb22 = 2.0f / (ay1 + ay2);
  224. VData.gb42 = VData.gb22 * (ay1 - 1.0f) * 0.5f;
  225. VData.Kgbx1 = 0.5f * (1.0f - ax1);
  226. VData.Kgbx2 = 0.5f * (1.0f + ax2);
  227. VData.Kgby1 = 0.5f * (1.0f - ay1);
  228. VData.Kgby2 = 0.5f * (1.0f + ay2);
  229. }
  230. else
  231. {
  232. VData.minXgb = VData.minX;
  233. VData.maxXgb = VData.maxX;
  234. VData.minYgb = VData.minY;
  235. VData.maxYgb = VData.maxY;
  236. }
  237. }
  238. // Update Mproj*Mclip
  239. if( m_dwDirtyFlags & RRPV_DIRTY_PROJXFM )
  240. {
  241. D3DMATRIX MShift;
  242. ZeroMemory (&MShift, sizeof(D3DMATRIX));
  243. MShift._11 = 0.5f;
  244. MShift._22 = 0.5f;
  245. MShift._41 = 0.5f;
  246. MShift._42 = 0.5f;
  247. MShift._44 = 1.0f;
  248. MShift._33 = 1.0f;
  249. MatrixProduct(&TData.m_PS, &m_xfmProj, &MShift);
  250. }
  251. // Update Mview*Mproj*Mclip
  252. if( m_dwDirtyFlags & (RRPV_DIRTY_VIEWXFM | RRPV_DIRTY_PROJXFM) )
  253. {
  254. MatrixProduct(&TData.m_VPS, &m_xfmView, &TData.m_PS);
  255. Inverse4x4( (D3DMATRIX *)&TData.m_VPS, (D3DMATRIX *)&TData.m_VPSInv );
  256. }
  257. for( DWORD i=0; i< RRMAX_WORLD_MATRICES; i++)
  258. {
  259. MatrixProduct(&m_xfmCurrent[i], &m_xfmWorld[i], &TData.m_VPS);
  260. }
  261. // Compute xfmToEye (world*view) matrix (needed for lighting and fog)
  262. // if needed
  263. if (m_dwDirtyFlags & (RRPV_DIRTY_VIEWXFM |
  264. RRPV_DIRTY_WORLDXFM |
  265. RRPV_DIRTY_WORLD1XFM |
  266. RRPV_DIRTY_WORLD2XFM |
  267. RRPV_DIRTY_WORLD3XFM ))
  268. {
  269. m_dwDirtyFlags |= RRPV_DIRTY_INVERSEWORLDVIEW;
  270. }
  271. if (m_dwTLState & (RRPV_DOLIGHTING | RRPV_DOFOG | RRPV_DOCOMPUTEPOINTSIZE |
  272. RRPV_DOPASSEYENORMAL | RRPV_DOPASSEYEXYZ) &&
  273. (m_dwDirtyFlags & RRPV_DIRTY_INVERSEWORLDVIEW))
  274. {
  275. for( i=0; i< RRMAX_WORLD_MATRICES; i++)
  276. {
  277. MatrixProduct(&m_xfmToEye[i], &m_xfmWorld[i], &m_xfmView);
  278. Inverse4x4((D3DMATRIX *)&m_xfmToEye[i],
  279. (D3DMATRIX *)&m_xfmToEyeInv[i]);
  280. m_dwDirtyFlags |= RRPV_DIRTY_NEEDXFMLIGHT;
  281. }
  282. m_dwDirtyFlags &= ~RRPV_DIRTY_INVERSEWORLDVIEW;
  283. }
  284. // Clear the dirty transform flags
  285. m_dwDirtyFlags &= ~RRPV_DIRTY_XFORM;
  286. return hr;
  287. }