Leaked source code of windows server 2003
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

2409 lines
93 KiB

  1. ///////////////////////////////////////////////////////////////////////////////
  2. // Copyright (C) Microsoft Corporation, 2000.
  3. //
  4. // pshdrval.cpp
  5. //
  6. // Direct3D Reference Device - PixelShader validation
  7. //
  8. ///////////////////////////////////////////////////////////////////////////////
  9. #include "pch.cpp"
  10. #pragma hdrstop
  11. // Use these macros when looking at CPSInstruction derived members of the current instruction (CBaseInstruction)
  12. #define _CURR_PS_INST ((CPSInstruction*)m_pCurrInst)
  13. #define _PREV_PS_INST (m_pCurrInst?((CPSInstruction*)(m_pCurrInst->m_pPrevInst)):NULL)
  14. #define SWIZZLE_XYZZ (D3DVS_X_X | D3DVS_Y_Y | D3DVS_Z_Z | D3DVS_W_Z)
  15. #define SWIZZLE_XYZW (D3DVS_X_X | D3DVS_Y_Y | D3DVS_Z_Z | D3DVS_W_W)
  16. #define SWIZZLE_XYWW (D3DVS_X_X | D3DVS_Y_Y | D3DVS_Z_W | D3DVS_W_W)
  17. #define ZAPPED_ALPHA_TEXT "Note that an unfortunate effect of the phase marker earlier in the shader is "\
  18. "that the moment it is encountered in certain hardware, values previously "\
  19. "written to alpha in any r# register, including the one noted here, are lost. "\
  20. "In order to read alpha from an r# register after the phase marker, write to it first."
  21. #define ZAPPED_ALPHA_TEXT2 "Note that an unfortunate effect of the phase marker in the shader is "\
  22. "that the moment it is encountered in certain hardware, values previously "\
  23. "written to alpha in any r# register, including r0, are lost. "\
  24. "So after a phase marker, the alpha component of r0 must be written."
  25. #define ZAPPED_BLUE_TEXT "Note that when texcrd is used with a .xy(==.rg) writemask, "\
  26. "as it is in this shader, a side effect is that anything previously "\
  27. "written to the z(==b) component of the destination r# register is lost "\
  28. "and this component becomes uninitialized. In order to read blue again, write to it first."
  29. #define ZAPPED_BLUE_TEXT2 "Note that when texcrd is used with a .xy(==.rg) writemask, "\
  30. "as it is in this shader, a side effect is that anything previously "\
  31. "written to the z(==b) component of the destination r# register is lost "\
  32. "and this component becomes uninitialized. The blue component of r0 must to be written after the texcrd."
  33. //-----------------------------------------------------------------------------
  34. // CPShaderValidator14::CPShaderValidator14
  35. //-----------------------------------------------------------------------------
  36. CPShaderValidator14::CPShaderValidator14( const DWORD* pCode,
  37. const D3DCAPS8* pCaps,
  38. DWORD Flags )
  39. : CBasePShaderValidator( pCode, pCaps, Flags )
  40. {
  41. // Note that the base constructor initialized m_ReturnCode to E_FAIL.
  42. // Only set m_ReturnCode to S_OK if validation has succeeded,
  43. // before exiting this constructor.
  44. m_Phase = 2; // default to second pass.
  45. m_pPhaseMarkerInst = NULL;
  46. m_bPhaseMarkerInShader = FALSE;
  47. m_TempRegsWithZappedAlpha = 0;
  48. m_TempRegsWithZappedBlue = 0;
  49. if( !m_bBaseInitOk )
  50. return;
  51. ValidateShader(); // If successful, m_ReturnCode will be set to S_OK.
  52. // Call GetStatus() on this object to determine validation outcome.
  53. }
  54. //-----------------------------------------------------------------------------
  55. // CPShaderValidator14::IsCurrInstTexOp
  56. //-----------------------------------------------------------------------------
  57. void CPShaderValidator14::IsCurrInstTexOp()
  58. {
  59. DXGASSERT(m_pCurrInst);
  60. switch (m_pCurrInst->m_Type)
  61. {
  62. case D3DSIO_TEX:
  63. case D3DSIO_TEXCOORD:
  64. case D3DSIO_TEXKILL:
  65. case D3DSIO_TEXDEPTH:
  66. _CURR_PS_INST->m_bTexOp = TRUE;
  67. break;
  68. }
  69. switch(m_pCurrInst->m_Type)
  70. {
  71. case D3DSIO_TEXKILL:
  72. case D3DSIO_TEXDEPTH:
  73. case D3DSIO_TEXCOORD:
  74. _CURR_PS_INST->m_bTexOpThatReadsTexture = FALSE;
  75. break;
  76. case D3DSIO_TEX:
  77. _CURR_PS_INST->m_bTexOpThatReadsTexture = TRUE;
  78. break;
  79. }
  80. }
  81. #define MAX_NUM_STAGES_2_0 6 // #defined because there are dependencies.
  82. //-----------------------------------------------------------------------------
  83. // CPShaderValidator14::InitValidation
  84. //-----------------------------------------------------------------------------
  85. BOOL CPShaderValidator14::InitValidation()
  86. {
  87. switch( m_Version >> 16 )
  88. {
  89. case 0xfffe:
  90. Spew( SPEW_GLOBAL_ERROR, NULL, "Version Token: 0x%x indicates a vertex shader. Pixel shader version token must be of the form 0xffff****.",
  91. m_Version);
  92. return FALSE;
  93. case 0xffff:
  94. break; // pixelshader - ok.
  95. default:
  96. Spew( SPEW_GLOBAL_ERROR, NULL, "Version Token: 0x%x is invalid. Pixel shader version token must be of the form 0xffff****. Aborting pixel shader validation.",
  97. m_Version);
  98. return FALSE;
  99. }
  100. if( m_pCaps )
  101. {
  102. if( (m_pCaps->PixelShaderVersion & 0x0000FFFF) < (m_Version & 0x0000FFFF) )
  103. {
  104. Spew( SPEW_GLOBAL_ERROR, NULL, "Version Token: Pixel shader version %d.%d is too high for device. Maximum supported version is %d.%d. Aborting shader validation.",
  105. D3DSHADER_VERSION_MAJOR(m_Version),D3DSHADER_VERSION_MINOR(m_Version),
  106. D3DSHADER_VERSION_MAJOR(m_pCaps->PixelShaderVersion),D3DSHADER_VERSION_MINOR(m_pCaps->PixelShaderVersion));
  107. return FALSE;
  108. }
  109. }
  110. switch(m_Version)
  111. {
  112. case D3DPS_VERSION(1,4): // DX8.1
  113. m_pInputRegFile = new CRegisterFile(2,FALSE,2,TRUE); // #regs, bWritable, max# reads/instruction, pre-shader initialized
  114. m_pConstRegFile = new CRegisterFile(8,FALSE,2,TRUE);
  115. m_pTextureRegFile = new CRegisterFile(MAX_NUM_STAGES_2_0,FALSE, 1,TRUE);
  116. m_pTempRegFile = new CRegisterFile(MAX_NUM_STAGES_2_0,TRUE,3,FALSE);
  117. break;
  118. default:
  119. Spew( SPEW_GLOBAL_ERROR, NULL, "Version Token: %d.%d is not a supported pixel shader version. Aborting pixel shader validation.",
  120. D3DSHADER_VERSION_MAJOR(m_Version),D3DSHADER_VERSION_MINOR(m_Version));
  121. return FALSE;
  122. }
  123. if( NULL == m_pInputRegFile ||
  124. NULL == m_pConstRegFile ||
  125. NULL == m_pTextureRegFile ||
  126. NULL == m_pTempRegFile )
  127. {
  128. Spew( SPEW_GLOBAL_ERROR, NULL, "Out of memory.");
  129. return FALSE;
  130. }
  131. const DWORD* pCurrToken = m_pCurrToken;
  132. // Loop through all the instructions to see if a phase change marker is present.
  133. while( *pCurrToken != D3DPS_END() )
  134. {
  135. D3DSHADER_INSTRUCTION_OPCODE_TYPE Type = (D3DSHADER_INSTRUCTION_OPCODE_TYPE)(*pCurrToken & D3DSI_OPCODE_MASK);
  136. if( D3DSIO_COMMENT == Type )
  137. {
  138. // Skip comments
  139. DWORD NumDWORDs = ((*pCurrToken) & D3DSI_COMMENTSIZE_MASK) >> D3DSI_COMMENTSIZE_SHIFT;
  140. pCurrToken += (NumDWORDs+1);
  141. continue;
  142. }
  143. if( D3DSIO_PHASE == Type )
  144. {
  145. m_bPhaseMarkerInShader = TRUE;
  146. m_Phase = 1;
  147. }
  148. pCurrToken++;
  149. // Dst param
  150. if (*pCurrToken & (1L<<31))
  151. {
  152. pCurrToken++;
  153. if( D3DSIO_DEF == Type )
  154. {
  155. pCurrToken += 4;
  156. continue;
  157. }
  158. }
  159. // Decode src param(s)
  160. while (*pCurrToken & (1L<<31))
  161. {
  162. pCurrToken++;
  163. }
  164. }
  165. return TRUE;
  166. }
  167. //-----------------------------------------------------------------------------
  168. // CPShaderValidator14::ApplyPerInstructionRules
  169. //
  170. // Returns FALSE if shader validation must terminate.
  171. // Returns TRUE if validation may proceed to next instruction.
  172. //-----------------------------------------------------------------------------
  173. BOOL CPShaderValidator14::ApplyPerInstructionRules()
  174. {
  175. if( ! Rule_InstructionRecognized() ) return FALSE; // Bail completely on unrecognized instr.
  176. if( ! Rule_InstructionSupportedByVersion() ) goto EXIT;
  177. if( ! Rule_ValidParamCount() ) goto EXIT;
  178. if( ! Rule_ValidMarker() ) goto EXIT; // must be before any rule that needs to know what the current phase is
  179. // Rules that examine source parameters
  180. if( ! Rule_ValidSrcParams() ) goto EXIT;
  181. if( ! Rule_MultipleDependentTextureReads() ) goto EXIT; // needs to be after _ValidSrcParams(), and before _ValidDstParam(), _SrcInitialized()
  182. if( ! Rule_SrcInitialized() ) goto EXIT; // needs to be before _ValidDstParam()
  183. if( ! Rule_ValidDstParam() ) goto EXIT;
  184. if( ! Rule_ValidRegisterPortUsage() ) goto EXIT;
  185. if( ! Rule_TexOpAfterArithmeticOp() ) goto EXIT;
  186. if( ! Rule_ValidTexOpStageAndRegisterUsage() ) goto EXIT;
  187. if( ! Rule_LimitedUseOfProjModifier() ) goto EXIT;
  188. if( ! Rule_ValidTEXDEPTHInstruction() ) goto EXIT;
  189. if( ! Rule_ValidTEXKILLInstruction() ) goto EXIT;
  190. if( ! Rule_ValidBEMInstruction() ) goto EXIT;
  191. if( ! Rule_ValidDEFInstruction() ) goto EXIT;
  192. if( ! Rule_ValidInstructionPairing() ) goto EXIT;
  193. if( ! Rule_ValidInstructionCount() ) goto EXIT;
  194. EXIT:
  195. return TRUE;
  196. }
  197. //-----------------------------------------------------------------------------
  198. // CPShaderValidator14::ApplyPostInstructionsRules
  199. //-----------------------------------------------------------------------------
  200. void CPShaderValidator14::ApplyPostInstructionsRules()
  201. {
  202. Rule_ValidInstructionCount(); // see if we went over the limits
  203. Rule_R0Written();
  204. }
  205. //-----------------------------------------------------------------------------
  206. //
  207. // Per Instruction Rules
  208. //
  209. //-----------------------------------------------------------------------------
  210. //-----------------------------------------------------------------------------
  211. // CPShaderValidator14::Rule_InstructionRecognized
  212. //
  213. // ** Rule:
  214. // Is the instruction opcode known? (regardless of shader version)
  215. //
  216. // ** When to call:
  217. // Per instruction.
  218. //
  219. // ** Returns:
  220. // FALSE when instruction not recognized.
  221. //
  222. //-----------------------------------------------------------------------------
  223. BOOL CPShaderValidator14::Rule_InstructionRecognized()
  224. {
  225. switch(m_pCurrInst->m_Type)
  226. {
  227. case D3DSIO_MOV:
  228. case D3DSIO_ADD:
  229. case D3DSIO_SUB:
  230. case D3DSIO_MUL:
  231. case D3DSIO_MAD:
  232. case D3DSIO_LRP:
  233. case D3DSIO_DP3:
  234. case D3DSIO_TEX:
  235. case D3DSIO_TEXBEM:
  236. case D3DSIO_TEXBEML:
  237. case D3DSIO_CND:
  238. case D3DSIO_TEXCOORD:
  239. case D3DSIO_TEXM3x2PAD:
  240. case D3DSIO_TEXM3x2TEX:
  241. case D3DSIO_TEXM3x3PAD:
  242. case D3DSIO_TEXM3x3TEX:
  243. case D3DSIO_TEXM3x3SPEC:
  244. case D3DSIO_TEXM3x3VSPEC:
  245. case D3DSIO_TEXREG2AR:
  246. case D3DSIO_TEXREG2GB:
  247. case D3DSIO_TEXKILL:
  248. case D3DSIO_END:
  249. case D3DSIO_NOP:
  250. case D3DSIO_DEF:
  251. case D3DSIO_TEXM3x2DEPTH:
  252. case D3DSIO_TEXDP3:
  253. case D3DSIO_TEXREG2RGB:
  254. case D3DSIO_DP4:
  255. case D3DSIO_CMP:
  256. case D3DSIO_TEXDP3TEX:
  257. case D3DSIO_TEXM3x3:
  258. case D3DSIO_TEXDEPTH:
  259. case D3DSIO_BEM:
  260. case D3DSIO_PHASE:
  261. return TRUE; // instruction recognized - ok.
  262. }
  263. // if we get here, the instruction is not recognized
  264. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Unrecognized instruction. Aborting pixel shader validation.");
  265. m_ErrorCount++;
  266. return FALSE;
  267. }
  268. //-----------------------------------------------------------------------------
  269. // CPShaderValidator14::Rule_InstructionSupportedByVersion
  270. //
  271. // ** Rule:
  272. // Is the instruction supported by the current pixel shader version?
  273. //
  274. // ** When to call:
  275. // Per instruction.
  276. //
  277. // ** Returns:
  278. // FALSE when instruction not supported by version.
  279. //
  280. //-----------------------------------------------------------------------------
  281. BOOL CPShaderValidator14::Rule_InstructionSupportedByVersion()
  282. {
  283. if( D3DPS_VERSION(1,4) <= m_Version ) // 1.3 and above
  284. {
  285. switch(m_pCurrInst->m_Type)
  286. {
  287. case D3DSIO_MOV:
  288. case D3DSIO_ADD:
  289. case D3DSIO_SUB:
  290. case D3DSIO_MUL:
  291. case D3DSIO_MAD:
  292. case D3DSIO_LRP:
  293. case D3DSIO_DP3:
  294. case D3DSIO_DEF:
  295. case D3DSIO_CND:
  296. case D3DSIO_CMP:
  297. case D3DSIO_DP4:
  298. case D3DSIO_BEM:
  299. case D3DSIO_TEX:
  300. case D3DSIO_TEXKILL:
  301. case D3DSIO_TEXDEPTH:
  302. case D3DSIO_TEXCOORD:
  303. case D3DSIO_PHASE:
  304. return TRUE; // instruction supported - ok.
  305. }
  306. }
  307. switch(m_pCurrInst->m_Type)
  308. {
  309. case D3DSIO_END:
  310. case D3DSIO_NOP:
  311. return TRUE; // instruction supported - ok.
  312. }
  313. // if we get here, the instruction is not supported.
  314. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Instruction not supported by version %d.%d pixel shader.",
  315. D3DSHADER_VERSION_MAJOR(m_Version),D3DSHADER_VERSION_MINOR(m_Version));
  316. m_ErrorCount++;
  317. return FALSE; // no more checks on this instruction
  318. }
  319. //-----------------------------------------------------------------------------
  320. // CPShaderValidator14::Rule_ValidParamCount
  321. //
  322. // ** Rule:
  323. // Is the parameter count correct for the instruction?
  324. //
  325. // DEF is a special case that is treated as having only 1 dest parameter,
  326. // even though there are also 4 source parameters. The 4 source params for DEF
  327. // are immediate float values, so there is nothing to check, and no way of
  328. // knowing whether or not those parameter tokens were actually present in the
  329. // token list - all the validator can do is skip over 4 DWORDS (which it does).
  330. //
  331. // ** When to call:
  332. // Per instruction.
  333. //
  334. // ** Returns:
  335. // FALSE when the parameter count is incorrect.
  336. //
  337. //-----------------------------------------------------------------------------
  338. BOOL CPShaderValidator14::Rule_ValidParamCount()
  339. {
  340. BOOL bBadParamCount = FALSE;
  341. if (m_pCurrInst->m_SrcParamCount + m_pCurrInst->m_DstParamCount > SHADER_INSTRUCTION_MAX_PARAMS) bBadParamCount = TRUE;
  342. switch (m_pCurrInst->m_Type)
  343. {
  344. case D3DSIO_NOP:
  345. case D3DSIO_PHASE:
  346. bBadParamCount = (m_pCurrInst->m_DstParamCount != 0) || (m_pCurrInst->m_SrcParamCount != 0); break;
  347. case D3DSIO_MOV:
  348. bBadParamCount = (m_pCurrInst->m_DstParamCount != 1) || (m_pCurrInst->m_SrcParamCount != 1); break;
  349. case D3DSIO_ADD:
  350. case D3DSIO_SUB:
  351. case D3DSIO_MUL:
  352. case D3DSIO_DP3:
  353. case D3DSIO_DP4:
  354. case D3DSIO_BEM:
  355. bBadParamCount = (m_pCurrInst->m_DstParamCount != 1) || (m_pCurrInst->m_SrcParamCount != 2); break;
  356. case D3DSIO_MAD:
  357. case D3DSIO_LRP:
  358. case D3DSIO_CND:
  359. case D3DSIO_CMP:
  360. bBadParamCount = (m_pCurrInst->m_DstParamCount != 1) || (m_pCurrInst->m_SrcParamCount != 3); break;
  361. case D3DSIO_TEXKILL:
  362. case D3DSIO_TEXDEPTH:
  363. case D3DSIO_DEF: // we skipped the last 4 parameters (float vector) - nothing to check
  364. bBadParamCount = (m_pCurrInst->m_DstParamCount != 1) || (m_pCurrInst->m_SrcParamCount != 0); break;
  365. case D3DSIO_TEX:
  366. case D3DSIO_TEXCOORD:
  367. bBadParamCount = (m_pCurrInst->m_DstParamCount != 1) || (m_pCurrInst->m_SrcParamCount != 1); break;
  368. }
  369. if (bBadParamCount)
  370. {
  371. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Invalid parameter count.");
  372. m_ErrorCount++;
  373. return FALSE; // no more checks on this instruction
  374. }
  375. return TRUE;
  376. }
  377. //-----------------------------------------------------------------------------
  378. // CPShaderValidator14::Rule_ValidSrcParams
  379. //
  380. // ** Rule:
  381. // for each source parameter,
  382. // if current instruction is a texture instruction, then
  383. // if texcrd, source register type must be t# (texture coordinate input)
  384. // else source register type must be t# or r# (temp)
  385. // register number must be in range
  386. // _DZ and _DW are the only source modifiers allowed
  387. // no source selector allowed,
  388. // except texcrd/texld which can have: .xyz(==.xyzz), nothing(=.xyzw), and .xyw(=.xyww)
  389. // else (non texture instruction)
  390. // if in phase 1 of shader, v# registers not allowed
  391. // t# registers not allowed (only const or temp allowed)
  392. // register number must be in range
  393. // source modifier must be one of:
  394. // _NONE/_NEG/_BIAS/_BIASNEG/_SIGN/_SIGNNEG/_X2/_X2NEG
  395. // source selector must be one of:
  396. // _NOSWIZZLE/_REPLICATEALPHA/RED/GREEN/BLUE
  397. //
  398. // Note that the parameter count for D3DSIO_DEF is treated as 1
  399. // (dest only), so this rule does nothing for it.
  400. //
  401. // ** When to call:
  402. // Per instruction.
  403. //
  404. // ** Returns:
  405. // Always TRUE.
  406. //
  407. // Errors in any of the source parameters causes m_bSrcParamError[i]
  408. // to be TRUE, so later rules that only apply when a particular source
  409. // parameter was valid know whether they need to execute or not.
  410. // e.g. Rule_SrcInitialized.
  411. //
  412. //-----------------------------------------------------------------------------
  413. BOOL CPShaderValidator14::Rule_ValidSrcParams()
  414. {
  415. static DWORD s_TexcrdSrcSwizzle[MAX_NUM_STAGES_2_0];
  416. static BOOL s_bSeenTexcrdSrcSwizzle[MAX_NUM_STAGES_2_0];
  417. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  418. {
  419. for( UINT i = 0; i < MAX_NUM_STAGES_2_0; i++ )
  420. s_bSeenTexcrdSrcSwizzle[i] = FALSE;
  421. }
  422. for( UINT i = 0; i < m_pCurrInst->m_SrcParamCount; i++ )
  423. {
  424. BOOL bFoundSrcError = FALSE;
  425. SRCPARAM* pSrcParam = &(m_pCurrInst->m_SrcParam[i]);
  426. DWORD Swizzle = pSrcParam->m_SwizzleShift;
  427. char szSourceName[32];
  428. switch(i + 1)
  429. {
  430. case 1:
  431. if( 1 == m_pCurrInst->m_SrcParamCount )
  432. sprintf( szSourceName, "(Source param) " );
  433. else
  434. sprintf( szSourceName, "(First source param) " );
  435. break;
  436. case 2:
  437. sprintf( szSourceName, "(Second source param) " );
  438. break;
  439. case 3:
  440. sprintf( szSourceName, "(Third source param) " );
  441. break;
  442. default:
  443. DXGASSERT(FALSE);
  444. }
  445. if( _CURR_PS_INST->m_bTexOp )
  446. {
  447. UINT ValidRegNum = 0;
  448. switch (m_pCurrInst->m_Type)
  449. {
  450. case D3DSIO_TEXCOORD:
  451. if( D3DSPR_TEXTURE != pSrcParam->m_RegType )
  452. {
  453. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sSource register type must be texture coordinate input (t#) for texcrd instruction.",
  454. szSourceName);
  455. m_ErrorCount++;
  456. bFoundSrcError = TRUE;
  457. }
  458. ValidRegNum = m_pTextureRegFile->GetNumRegs(); break;
  459. break;
  460. default:
  461. switch(pSrcParam->m_RegType)
  462. {
  463. case D3DSPR_TEMP: ValidRegNum = m_pTempRegFile->GetNumRegs(); break;
  464. case D3DSPR_TEXTURE: ValidRegNum = m_pTextureRegFile->GetNumRegs(); break;
  465. default:
  466. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sSource register type must be temp (r#) or texture coordinate input (t#) for tex* instruction.",
  467. szSourceName);
  468. m_ErrorCount++;
  469. bFoundSrcError = TRUE;
  470. goto LOOP_CONTINUE;
  471. }
  472. break;
  473. }
  474. if( pSrcParam->m_RegNum >= ValidRegNum )
  475. {
  476. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sInvalid register number: %d. Max allowed for this type is %d.",
  477. szSourceName, pSrcParam->m_RegNum, ValidRegNum - 1);
  478. m_ErrorCount++;
  479. bFoundSrcError = TRUE;
  480. }
  481. BOOL bGenericSrcModError = FALSE;
  482. switch(pSrcParam->m_SrcMod)
  483. {
  484. case D3DSPSM_NONE:
  485. break;
  486. case D3DSPSM_DZ:
  487. switch(m_pCurrInst->m_Type)
  488. {
  489. case D3DSIO_TEX:
  490. if( D3DSPR_TEMP != pSrcParam->m_RegType )
  491. {
  492. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  493. "_dz(=_db) modifier on source param for texld only allowed if source is a temp register (r#)." );
  494. m_ErrorCount++;
  495. bFoundSrcError = TRUE;
  496. }
  497. if( 1 == m_Phase )
  498. {
  499. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  500. "_dz(=_db) modifier on source param for texld only allowed in second phase of a shader.");
  501. m_ErrorCount++;
  502. bFoundSrcError = TRUE;
  503. }
  504. if( (SWIZZLE_XYZZ != Swizzle) &&
  505. (SWIZZLE_XYZW != Swizzle) )
  506. {
  507. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  508. "_dz(=_db) modifier on source param for texld must be paired with source selector .xyz(=.rgb). "\
  509. "Note: Using no selector is treated same as .xyz here.");
  510. m_ErrorCount++;
  511. bFoundSrcError = TRUE;
  512. }
  513. break;
  514. case D3DSIO_TEXCOORD:
  515. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  516. "_dz(=_db) modifier cannot be used on source parameter for texcrd. "\
  517. "It is only available to texld instruction, when source parameter is temp register (r#).");
  518. m_ErrorCount++;
  519. bFoundSrcError = TRUE;
  520. break;
  521. default:
  522. bGenericSrcModError = TRUE; break;
  523. }
  524. break;
  525. case D3DSPSM_DW:
  526. switch(m_pCurrInst->m_Type)
  527. {
  528. case D3DSIO_TEX:
  529. if( D3DSPR_TEXTURE != pSrcParam->m_RegType )
  530. {
  531. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  532. "_dw(=_da) modifier on source param for texld only allowed if source is a texture coordinate register (t#)." );
  533. m_ErrorCount++;
  534. bFoundSrcError = TRUE;
  535. }
  536. // falling through
  537. case D3DSIO_TEXCOORD:
  538. if( SWIZZLE_XYWW != Swizzle )
  539. {
  540. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  541. "_dw(=_da) modifier on source param must be paired with source selector .xyw(=.rga)." );
  542. m_ErrorCount++;
  543. bFoundSrcError = TRUE;
  544. }
  545. break;
  546. default:
  547. bGenericSrcModError = TRUE; break;
  548. }
  549. break;
  550. default:
  551. bGenericSrcModError = TRUE; break;
  552. }
  553. if( bGenericSrcModError )
  554. {
  555. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sInvalid source modifier for tex* instruction.", szSourceName);
  556. m_ErrorCount++;
  557. bFoundSrcError = TRUE;
  558. }
  559. switch (m_pCurrInst->m_Type)
  560. {
  561. case D3DSIO_TEXCOORD:
  562. if( (SWIZZLE_XYZZ != Swizzle) &&
  563. (SWIZZLE_XYZW != Swizzle) &&
  564. (SWIZZLE_XYWW != Swizzle) )
  565. {
  566. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  567. "Source for texcrd requires component selector .xyw(==.rga), or .xyz(==.rgb). "\
  568. "Note: Using no selector is treated same as .xyz here.");
  569. m_ErrorCount++;
  570. bFoundSrcError = TRUE;
  571. }
  572. break;
  573. case D3DSIO_TEX:
  574. if( D3DSPR_TEXTURE == pSrcParam->m_RegType )
  575. {
  576. if( (SWIZZLE_XYZZ != Swizzle) &&
  577. (SWIZZLE_XYZW != Swizzle) &&
  578. (SWIZZLE_XYWW != Swizzle) )
  579. {
  580. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  581. "Using a texture coordinate register (t#) as source for texld requires component selector .xyw(=.rga), or .xyz(=.rgb). "\
  582. "Note: Using no selector is treated same as .xyz here.");
  583. m_ErrorCount++;
  584. bFoundSrcError = TRUE;
  585. }
  586. }
  587. else if( D3DSPR_TEMP == pSrcParam->m_RegType )
  588. {
  589. if( (SWIZZLE_XYZZ != Swizzle) &&
  590. (SWIZZLE_XYZW != Swizzle) )
  591. {
  592. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  593. "Using a temp register (r#) as source for texld requires component selector .xyz(==.rgb). "\
  594. "Note: Using no selector is treated same as .xyz here.");
  595. m_ErrorCount++;
  596. bFoundSrcError = TRUE;
  597. }
  598. }
  599. break;
  600. default:
  601. switch (pSrcParam->m_SwizzleShift)
  602. {
  603. case D3DSP_NOSWIZZLE:
  604. break;
  605. default:
  606. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sInvalid source selector for tex* instruction.", szSourceName);
  607. m_ErrorCount++;
  608. bFoundSrcError = TRUE;
  609. }
  610. break;
  611. }
  612. switch(m_pCurrInst->m_Type)
  613. {
  614. case D3DSIO_TEXCOORD:
  615. case D3DSIO_TEX:
  616. if( D3DSPR_TEXTURE != pSrcParam->m_RegType )
  617. break;
  618. // Verify that if a specific t# register is read more than once, each read uses the same source selector.
  619. if( s_bSeenTexcrdSrcSwizzle[pSrcParam->m_RegNum] )
  620. {
  621. // only check rgb swizzle (ignore a)
  622. if( (Swizzle & (0x3F << D3DVS_SWIZZLE_SHIFT)) != (s_TexcrdSrcSwizzle[pSrcParam->m_RegNum] & (0x3F << D3DVS_SWIZZLE_SHIFT) ))
  623. {
  624. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  625. "Texture coordinate register t%d read more than once in shader with different source selector (swizzle). "\
  626. "Multiple reads of identical texture coordinate register throughout shader must all use identical source selector. "\
  627. "Note this does not restrict mixing use and non-use of a source modifier (i.e. _dw/_da or _dz/_db, depending what the swizzle allows) on these coordinate register reads.",
  628. pSrcParam->m_RegNum);
  629. m_ErrorCount++;
  630. bFoundSrcError = TRUE;
  631. }
  632. }
  633. s_bSeenTexcrdSrcSwizzle[pSrcParam->m_RegNum] = TRUE;
  634. s_TexcrdSrcSwizzle[pSrcParam->m_RegNum] = Swizzle;
  635. break;
  636. }
  637. }
  638. else // not a tex op
  639. {
  640. UINT ValidRegNum = 0;
  641. switch(pSrcParam->m_RegType)
  642. {
  643. case D3DSPR_INPUT:
  644. if( 1 == m_Phase )
  645. {
  646. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sInput registers (v#) are not available in phase 1 of the shader.", szSourceName);
  647. m_ErrorCount++;
  648. bFoundSrcError = TRUE;
  649. }
  650. else
  651. {
  652. ValidRegNum = m_pInputRegFile->GetNumRegs();
  653. }
  654. break;
  655. case D3DSPR_CONST: ValidRegNum = m_pConstRegFile->GetNumRegs(); break;
  656. case D3DSPR_TEMP: ValidRegNum = m_pTextureRegFile->GetNumRegs(); break;
  657. case D3DSPR_TEXTURE:
  658. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sTexture coordinate registers (t#) are not available to arithmetic instructions.", szSourceName);
  659. m_ErrorCount++;
  660. bFoundSrcError = TRUE;
  661. break;
  662. default:
  663. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sInvalid register type.", szSourceName);
  664. m_ErrorCount++;
  665. bFoundSrcError = TRUE;
  666. }
  667. if( (!bFoundSrcError) && (pSrcParam->m_RegNum >= ValidRegNum) )
  668. {
  669. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sInvalid register number: %d. Max allowed for this type is %d.",
  670. szSourceName, pSrcParam->m_RegNum, ValidRegNum - 1);
  671. m_ErrorCount++;
  672. bFoundSrcError = TRUE;
  673. }
  674. switch( pSrcParam->m_SrcMod )
  675. {
  676. case D3DSPSM_NONE:
  677. case D3DSPSM_NEG:
  678. case D3DSPSM_BIAS:
  679. case D3DSPSM_BIASNEG:
  680. case D3DSPSM_SIGN:
  681. case D3DSPSM_SIGNNEG:
  682. case D3DSPSM_COMP:
  683. case D3DSPSM_X2:
  684. case D3DSPSM_X2NEG:
  685. break;
  686. default:
  687. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sInvalid source modifier.",
  688. szSourceName);
  689. m_ErrorCount++;
  690. bFoundSrcError = TRUE;
  691. }
  692. switch( pSrcParam->m_SwizzleShift )
  693. {
  694. case D3DSP_NOSWIZZLE:
  695. case D3DSP_REPLICATERED:
  696. case D3DSP_REPLICATEGREEN:
  697. case D3DSP_REPLICATEBLUE:
  698. case D3DSP_REPLICATEALPHA:
  699. break;
  700. default:
  701. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%sInvalid source selector.",
  702. szSourceName);
  703. m_ErrorCount++;
  704. bFoundSrcError = TRUE;
  705. }
  706. }
  707. LOOP_CONTINUE:
  708. if( bFoundSrcError )
  709. {
  710. m_bSrcParamError[i] = TRUE; // needed in Rule_SrcInitialized
  711. }
  712. }
  713. return TRUE;
  714. }
  715. //-----------------------------------------------------------------------------
  716. // CPShaderValidator14::Rule_LimitedUseOfProjModifier
  717. //
  718. // ** Rule:
  719. // _dz may only appear at most 2 times in shader.
  720. //
  721. // ** When to call:
  722. // Per instruction.
  723. //
  724. // ** Returns:
  725. // Always TRUE.
  726. //
  727. //-----------------------------------------------------------------------------
  728. BOOL CPShaderValidator14::Rule_LimitedUseOfProjModifier()
  729. {
  730. static UINT s_ProjZModifierCount;
  731. static BOOL s_bSpewedError;
  732. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  733. {
  734. s_ProjZModifierCount = 0;
  735. s_bSpewedError = FALSE;
  736. }
  737. for( UINT i = 0; i < m_pCurrInst->m_SrcParamCount; i++ )
  738. {
  739. if( m_bSrcParamError[i] )
  740. continue;
  741. if( D3DSPSM_DZ == m_pCurrInst->m_SrcParam[i].m_SrcMod)
  742. {
  743. s_ProjZModifierCount++;
  744. }
  745. if( (2 < s_ProjZModifierCount) && (FALSE == s_bSpewedError) )
  746. {
  747. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "_dz(=_db) modifier may only be used at most 2 times in a shader." );
  748. s_bSpewedError = TRUE;
  749. m_ErrorCount++;
  750. }
  751. }
  752. return TRUE;
  753. }
  754. //-----------------------------------------------------------------------------
  755. // CPShaderValidator14::Rule_SrcInitialized
  756. //
  757. // ** Rule:
  758. // for each source parameter,
  759. // if source is a TEMP register then
  760. // the components flagged in the component read mask
  761. // (computed elsewhere) for the paramter must have been initialized
  762. //
  763. // When checking if a component has been written previously,
  764. // it must have been written in a previous cycle - so in the
  765. // case of co-issued instructions, initialization of a component
  766. // by one co-issued instruction is not available to the other for read.
  767. //
  768. // ** When to call:
  769. // Per instruction. This rule must be called before Rule_ValidDstParam().
  770. //
  771. // ** Returns:
  772. // Always TRUE.
  773. //
  774. // NOTE: This rule also updates the access history to indicate reads of the
  775. // affected components of each source register.
  776. //-----------------------------------------------------------------------------
  777. BOOL CPShaderValidator14::Rule_SrcInitialized()
  778. {
  779. DSTPARAM* pDstParam = &(m_pCurrInst->m_DstParam);
  780. BOOL bDestParamIsSrc = pDstParam->m_ComponentReadMask;
  781. UINT SrcParamCount = bDestParamIsSrc ? 1 : m_pCurrInst->m_SrcParamCount; // assumes if dest param is src,
  782. // there are no source params in instruction
  783. for( UINT i = 0; i < SrcParamCount; i++ )
  784. {
  785. DWORD UninitializedComponentsMask = 0;
  786. CAccessHistoryNode* pWriterInCurrCycle[4] = {0, 0, 0, 0};
  787. UINT NumUninitializedComponents = 0;
  788. UINT RegNum = bDestParamIsSrc ? pDstParam->m_RegNum : m_pCurrInst->m_SrcParam[i].m_RegNum;
  789. D3DSHADER_PARAM_REGISTER_TYPE Type = bDestParamIsSrc ? pDstParam->m_RegType : m_pCurrInst->m_SrcParam[i].m_RegType;
  790. DWORD ComponentReadMask = bDestParamIsSrc ? pDstParam->m_ComponentReadMask : m_pCurrInst->m_SrcParam[i].m_ComponentReadMask;
  791. CRegisterFile* pRegFile = NULL;
  792. char* RegChar = NULL;
  793. if( !bDestParamIsSrc && m_bSrcParamError[i] )
  794. continue;
  795. switch( Type )
  796. {
  797. case D3DSPR_TEMP:
  798. pRegFile = m_pTempRegFile;
  799. RegChar = "r";
  800. break;
  801. case D3DSPR_TEXTURE:
  802. pRegFile = m_pTextureRegFile;
  803. RegChar = "t";
  804. break;
  805. case D3DSPR_INPUT:
  806. pRegFile = m_pInputRegFile;
  807. RegChar = "v";
  808. break;
  809. case D3DSPR_CONST:
  810. pRegFile = m_pConstRegFile;
  811. RegChar = "c";
  812. break;
  813. }
  814. if( !pRegFile )
  815. continue;
  816. if( RegNum >= pRegFile->GetNumRegs() )
  817. continue;
  818. // check for read of uninitialized components
  819. if( D3DSPR_TEMP == Type ) // only bother doing this for temp regs, since everything else is initialized.
  820. {
  821. for( UINT Component = 0; Component < 4; Component++ )
  822. {
  823. if( !(ComponentReadMask & COMPONENT_MASKS[Component]) )
  824. continue;
  825. CAccessHistoryNode* pPreviousWriter = pRegFile->m_pAccessHistory[Component][RegNum].m_pMostRecentWriter;
  826. CBaseInstruction* pCurrInst = m_pCurrInst;
  827. // If co-issue, find the real previous writer.
  828. while( pPreviousWriter
  829. && ((CPSInstruction*)pPreviousWriter->m_pInst)->m_CycleNum == _CURR_PS_INST->m_CycleNum )
  830. {
  831. pWriterInCurrCycle[Component] = pPreviousWriter; // log read just before this write for co-issue
  832. pPreviousWriter = pPreviousWriter->m_pPreviousWriter;
  833. }
  834. // Even if pPreviousWriter == NULL, the component could have been initialized pre-shader.
  835. // So to check for initialization, we look at m_bInitialized below, rather than pPreviousWrite
  836. if(pPreviousWriter == NULL && !pRegFile->m_pAccessHistory[Component][RegNum].m_bPreShaderInitialized)
  837. {
  838. NumUninitializedComponents++;
  839. UninitializedComponentsMask |= COMPONENT_MASKS[Component];
  840. }
  841. }
  842. if( NumUninitializedComponents )
  843. {
  844. if( (UninitializedComponentsMask & COMPONENT_MASKS[3]) &&
  845. (m_TempRegsWithZappedAlpha & (1 << RegNum ) ) &&
  846. (UninitializedComponentsMask & COMPONENT_MASKS[2]) &&
  847. (m_TempRegsWithZappedBlue & (1 << RegNum ) ) )
  848. {
  849. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Read of uninitialized component%s(*) in %s%d: %s. "\
  850. ZAPPED_BLUE_TEXT " Also: " ZAPPED_ALPHA_TEXT,
  851. NumUninitializedComponents > 1 ? "s" : "",
  852. RegChar, RegNum, MakeAffectedComponentsText(UninitializedComponentsMask,TRUE,TRUE));
  853. }
  854. else if( (UninitializedComponentsMask & COMPONENT_MASKS[3]) &&
  855. (m_TempRegsWithZappedAlpha & (1 << RegNum ) ) )
  856. {
  857. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Read of uninitialized component%s(*) in %s%d: %s. "\
  858. ZAPPED_ALPHA_TEXT,
  859. NumUninitializedComponents > 1 ? "s" : "",
  860. RegChar, RegNum, MakeAffectedComponentsText(UninitializedComponentsMask,TRUE,TRUE));
  861. }
  862. else if( (UninitializedComponentsMask & COMPONENT_MASKS[2]) &&
  863. (m_TempRegsWithZappedBlue & (1 << RegNum ) ) )
  864. {
  865. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Read of uninitialized component%s(*) in %s%d: %s. "\
  866. ZAPPED_BLUE_TEXT,
  867. NumUninitializedComponents > 1 ? "s" : "",
  868. RegChar, RegNum, MakeAffectedComponentsText(UninitializedComponentsMask,TRUE,TRUE));
  869. }
  870. else
  871. {
  872. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Read of uninitialized component%s(*) in %s%d: %s",
  873. NumUninitializedComponents > 1 ? "s" : "",
  874. RegChar, RegNum, MakeAffectedComponentsText(UninitializedComponentsMask,TRUE,TRUE));
  875. }
  876. m_ErrorCount++;
  877. }
  878. }
  879. // Update register file to indicate READ.
  880. // Multiple reads of the same register component by the current instruction
  881. // will only be logged as one read in the access history.
  882. for( UINT Component = 0; Component < 4; Component++ )
  883. {
  884. #define PREV_READER(_CHAN,_REG) \
  885. ((NULL == pRegFile->m_pAccessHistory[_CHAN][_REG].m_pMostRecentReader) ? NULL :\
  886. pRegFile->m_pAccessHistory[_CHAN][_REG].m_pMostRecentReader->m_pInst)
  887. if( !(ComponentReadMask & COMPONENT_MASKS[Component]) )
  888. continue;
  889. if( NULL != pWriterInCurrCycle[Component] )
  890. {
  891. if( !pWriterInCurrCycle[Component]->m_pPreviousReader ||
  892. pWriterInCurrCycle[Component]->m_pPreviousReader->m_pInst != m_pCurrInst )
  893. {
  894. if( !pRegFile->m_pAccessHistory[Component][RegNum].InsertReadBeforeWrite(
  895. pWriterInCurrCycle[Component], m_pCurrInst ) )
  896. {
  897. Spew( SPEW_GLOBAL_ERROR, NULL, "Out of memory");
  898. m_ErrorCount++;
  899. }
  900. }
  901. }
  902. else if( PREV_READER(Component,RegNum) != m_pCurrInst )
  903. {
  904. if( !pRegFile->m_pAccessHistory[Component][RegNum].NewAccess(m_pCurrInst,FALSE) )
  905. {
  906. Spew( SPEW_GLOBAL_ERROR, NULL, "Out of memory");
  907. m_ErrorCount++;
  908. }
  909. }
  910. }
  911. }
  912. return TRUE;
  913. }
  914. //-----------------------------------------------------------------------------
  915. // CPShaderValidator14::Rule_MultipleDependentTextureReads
  916. //
  917. // ** Rule:
  918. //
  919. // Multiple dependent texture reads are disallowed. So texture read results
  920. // can be used as an address in a subsequent read, but the results from that
  921. // second read cannot be used as an address in yet another subsequent read.
  922. //
  923. // As pseudocode:
  924. //
  925. // if current instruction (x) is a tex-op that reads a texture
  926. // for each source param of x
  927. // if the register is a texture register
  928. // and there exists a previous writer (y),
  929. // and y is a tex op that reads a texture
  930. // if there exists a souce parameter of y that was previously
  931. // written by an instruction that reads a texture (z)
  932. // SPEW(Error)
  933. //
  934. // NOTE that it is assumed that tex ops must write to all components, so
  935. // only the read/write history for the R component is being checked.
  936. //
  937. // ** When to call:
  938. // Per instruction. This rule must be called before Rule_ValidDstParam(),
  939. // and Rule_SrcInitialized()
  940. // but after Rule_ValidSrcParams()
  941. //
  942. // ** Returns:
  943. // Always TRUE.
  944. //
  945. BOOL CPShaderValidator14::Rule_MultipleDependentTextureReads()
  946. {
  947. DSTPARAM* pDstParam = &(m_pCurrInst->m_DstParam);
  948. UINT DstRegNum = pDstParam->m_RegNum;
  949. char RegChar;
  950. #define THREE_TUPLE 3
  951. if( !_CURR_PS_INST->m_bTexOp )
  952. return TRUE;
  953. BOOL bDestParamIsSrc = pDstParam->m_ComponentReadMask;
  954. UINT SrcParamCount = bDestParamIsSrc ? 1 : m_pCurrInst->m_SrcParamCount; // assumes if dest param is src,
  955. // there are no source params in instruction
  956. if( D3DSPR_TEMP != pDstParam->m_RegType )
  957. return TRUE;
  958. for( UINT SrcParam = 0; SrcParam < SrcParamCount; SrcParam++ )
  959. {
  960. if( !bDestParamIsSrc && m_bSrcParamError[SrcParam] )
  961. continue;
  962. SRCPARAM* pSrcParam = bDestParamIsSrc ? NULL : &(m_pCurrInst->m_SrcParam[SrcParam]);
  963. UINT SrcRegNum = bDestParamIsSrc ? DstRegNum : pSrcParam->m_RegNum;
  964. CRegisterFile* pSrcRegFile = NULL;
  965. switch( bDestParamIsSrc ? pDstParam->m_RegType : pSrcParam->m_RegType )
  966. {
  967. case D3DSPR_TEMP:
  968. pSrcRegFile = m_pTempRegFile;
  969. RegChar = 'r';
  970. break;
  971. case D3DSPR_TEXTURE:
  972. pSrcRegFile = m_pTextureRegFile;
  973. RegChar = 't';
  974. break;
  975. }
  976. if( !pSrcRegFile )
  977. continue;
  978. if( SrcRegNum >= pSrcRegFile->GetNumRegs() )
  979. continue;
  980. for( UINT SrcComp = 0; SrcComp < THREE_TUPLE; SrcComp++ ) // Tex ops only read 3-tuples.
  981. {
  982. CAccessHistoryNode* pPreviousWriter = pSrcRegFile->m_pAccessHistory[SrcComp][SrcRegNum].m_pMostRecentWriter;
  983. CPSInstruction* pInst = pPreviousWriter ? (CPSInstruction*)pPreviousWriter->m_pInst : NULL;
  984. if( !pInst || !pInst->m_bTexOp )
  985. continue;
  986. // If the previous writer was in the current phase of the shader, spew an error.
  987. if( !m_pPhaseMarkerInst || (pInst->m_CycleNum > m_pPhaseMarkerInst->m_CycleNum) )
  988. {
  989. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  990. "The current tex* instruction reads from %c%d, which was written earlier by another "\
  991. "tex* instruction in the same block of tex* instructions. Dependent reads "\
  992. "are not permitted within a single block of tex* instructions. To perform a dependent read, "\
  993. "separate texture coordinate derivation from the tex* instruction using the coordinates "\
  994. "with a 'phase' marker.",
  995. RegChar,SrcRegNum );
  996. m_ErrorCount++;
  997. return TRUE; // Lets only spew this warning once per instruction.
  998. }
  999. }
  1000. }
  1001. return TRUE;
  1002. }
  1003. //-----------------------------------------------------------------------------
  1004. // CPShaderValidator14::Rule_ValidDstParam
  1005. //
  1006. // ** Rule:
  1007. // I instruction is D3DSIO_DEF, then do nothing - this case has its own separate rule
  1008. // The dst register must be writable.
  1009. // If the instruction has a dest parameter (i.e. every instruction except NOP), then
  1010. // the dst register must be of type D3DSPR_TEXTURE, and
  1011. // register # must be within range
  1012. // if instruction is a texture instruction, then
  1013. // the dst register must be of type D3DSPR_TEMP, and
  1014. // the writemask must be D3DSP_WRITEMASK_ALL
  1015. // or (.rgb for texcrd, .rg for texcrd with _dw source mod), and
  1016. // the dst modifier must be D3DSPDM_NONE (or _SAT on version > 1.1), and
  1017. // the dst shift must be none
  1018. // else (non tex instruction)
  1019. // the dst modifier must be D3DSPDM_NONE or _SATURATE, and
  1020. // dst shift must be /2, none, *2, or *4
  1021. //
  1022. // ** When to call:
  1023. // Per instruction.
  1024. //
  1025. // ** Returns:
  1026. // Always TRUE.
  1027. //
  1028. // NOTE: After checking the dst parameter, if no error was found,
  1029. // the write to the appropriate component(s) of the destination register
  1030. // is recorded by this function, so subsequent rules may check for previous
  1031. // write to registers.
  1032. //-----------------------------------------------------------------------------
  1033. BOOL CPShaderValidator14::Rule_ValidDstParam() // could break this down for more granularity
  1034. {
  1035. BOOL bFoundDstError = FALSE;
  1036. DSTPARAM* pDstParam = &(m_pCurrInst->m_DstParam);
  1037. UINT RegNum = pDstParam->m_RegNum;
  1038. if( D3DSIO_DEF == m_pCurrInst->m_Type )
  1039. {
  1040. // _DEF is a special instruction whose dest is a const register.
  1041. // We do the checking for this in a separate function.
  1042. // Also, we don't need to keep track of the fact that
  1043. // this instruction wrote to a register (done below),
  1044. // since _DEF just declares a constant.
  1045. return TRUE;
  1046. }
  1047. if( pDstParam->m_bParamUsed )
  1048. {
  1049. UINT ValidRegNum = 0;
  1050. BOOL bWritingToDest = TRUE;
  1051. switch( pDstParam->m_RegType )
  1052. {
  1053. case D3DSPR_TEMP:
  1054. ValidRegNum = m_pTempRegFile->GetNumRegs();
  1055. break;
  1056. case D3DSPR_TEXTURE:
  1057. ValidRegNum = m_pTempRegFile->GetNumRegs();
  1058. break;
  1059. }
  1060. if( D3DSIO_TEXKILL == m_pCurrInst->m_Type )
  1061. {
  1062. bWritingToDest = FALSE;
  1063. }
  1064. if( 0 == ValidRegNum ||
  1065. (D3DSPR_TEXTURE == pDstParam->m_RegType && bWritingToDest) )
  1066. {
  1067. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Invalid register type for destination param." );
  1068. m_ErrorCount++;
  1069. bFoundDstError = TRUE;
  1070. }
  1071. else if( RegNum >= ValidRegNum )
  1072. {
  1073. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Invalid destination register number: %d. Max allowed for this register type is %d.",
  1074. RegNum, ValidRegNum - 1);
  1075. m_ErrorCount++;
  1076. bFoundDstError = TRUE;
  1077. }
  1078. if( _CURR_PS_INST->m_bTexOp )
  1079. {
  1080. switch( m_pCurrInst->m_Type )
  1081. {
  1082. case D3DSIO_TEXCOORD:
  1083. if( D3DSPSM_DW == m_pCurrInst->m_SrcParam[0].m_SrcMod )
  1084. {
  1085. if( (D3DSP_WRITEMASK_0 | D3DSP_WRITEMASK_1) != pDstParam->m_WriteMask )
  1086. {
  1087. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "texcrd with _dw(=_da) source modifier must use .xy(=.rg) destination writemask.");
  1088. m_ErrorCount++;
  1089. bFoundDstError = TRUE;
  1090. }
  1091. }
  1092. else
  1093. {
  1094. if( (D3DSP_WRITEMASK_0 | D3DSP_WRITEMASK_1 | D3DSP_WRITEMASK_2) != pDstParam->m_WriteMask )
  1095. {
  1096. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "texcrd must use .xyz(=.rgb) destination writemask.");
  1097. m_ErrorCount++;
  1098. bFoundDstError = TRUE;
  1099. }
  1100. }
  1101. break;
  1102. case D3DSIO_TEX:
  1103. case D3DSIO_TEXKILL:
  1104. case D3DSIO_TEXDEPTH:
  1105. if( D3DSP_WRITEMASK_ALL != pDstParam->m_WriteMask )
  1106. {
  1107. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "texld/texkill/texdepth instructions must write all components." );
  1108. m_ErrorCount++;
  1109. bFoundDstError = TRUE;
  1110. }
  1111. break;
  1112. }
  1113. switch( pDstParam->m_DstMod )
  1114. {
  1115. case D3DSPDM_NONE:
  1116. break;
  1117. default:
  1118. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Instruction modifiers not allowed for tex* instructions." );
  1119. m_ErrorCount++;
  1120. bFoundDstError = TRUE;
  1121. }
  1122. switch( pDstParam->m_DstShift )
  1123. {
  1124. case DSTSHIFT_NONE:
  1125. break;
  1126. default:
  1127. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Destination shift not allowed for tex* instructions." );
  1128. m_ErrorCount++;
  1129. bFoundDstError = TRUE;
  1130. }
  1131. }
  1132. else
  1133. {
  1134. switch( pDstParam->m_DstMod )
  1135. {
  1136. case D3DSPDM_NONE:
  1137. case D3DSPDM_SATURATE:
  1138. break;
  1139. default:
  1140. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Invalid instruction modifier." );
  1141. m_ErrorCount++;
  1142. bFoundDstError = TRUE;
  1143. }
  1144. switch( pDstParam->m_DstShift )
  1145. {
  1146. case DSTSHIFT_NONE:
  1147. case DSTSHIFT_X2:
  1148. case DSTSHIFT_X4:
  1149. case DSTSHIFT_X8:
  1150. case DSTSHIFT_D2:
  1151. case DSTSHIFT_D4:
  1152. case DSTSHIFT_D8:
  1153. break;
  1154. default:
  1155. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Invalid destination shift." );
  1156. m_ErrorCount++;
  1157. bFoundDstError = TRUE;
  1158. }
  1159. }
  1160. // Update register file to indicate write.
  1161. if( !bFoundDstError && bWritingToDest)
  1162. {
  1163. CRegisterFile* pRegFile = NULL;
  1164. DWORD WriteMask = pDstParam->m_WriteMask;
  1165. switch( pDstParam->m_RegType )
  1166. {
  1167. case D3DSPR_TEMP: pRegFile = m_pTempRegFile; break;
  1168. }
  1169. if( pRegFile )
  1170. {
  1171. if( WriteMask & D3DSP_WRITEMASK_0 )
  1172. pRegFile->m_pAccessHistory[0][RegNum].NewAccess(m_pCurrInst,TRUE);
  1173. if( WriteMask & D3DSP_WRITEMASK_1 )
  1174. pRegFile->m_pAccessHistory[1][RegNum].NewAccess(m_pCurrInst,TRUE);
  1175. if( WriteMask & D3DSP_WRITEMASK_2 )
  1176. pRegFile->m_pAccessHistory[2][RegNum].NewAccess(m_pCurrInst,TRUE);
  1177. else if( D3DSIO_TEXCOORD == m_pCurrInst->m_Type )
  1178. {
  1179. // texcrd without b writemask uninitializes b channel.
  1180. // alpha also gets uninitialized, but phase marker alpha-nuke takes care of that anyway,
  1181. // and if the texcrd was in the first phase, noone could have written to the register
  1182. // so there would be nothing to nuke.
  1183. if( pRegFile->m_pAccessHistory[2][RegNum].m_pMostRecentWriter )
  1184. {
  1185. m_pTempRegFile->m_pAccessHistory[2][RegNum].~CAccessHistory();
  1186. m_pTempRegFile->m_pAccessHistory[2][RegNum].CAccessHistory::CAccessHistory();
  1187. m_TempRegsWithZappedBlue |= 1 << RegNum;
  1188. }
  1189. }
  1190. if( WriteMask & D3DSP_WRITEMASK_3 )
  1191. pRegFile->m_pAccessHistory[3][RegNum].NewAccess(m_pCurrInst,TRUE);
  1192. }
  1193. }
  1194. }
  1195. return TRUE;
  1196. }
  1197. //-----------------------------------------------------------------------------
  1198. // CPShaderValidator14::Rule_ValidRegisterPortUsage
  1199. //
  1200. // ** Rule:
  1201. // Each register class (TEXTURE,INPUT,CONST) may only appear as parameters
  1202. // in an individual instruction up to a maximum number of times.
  1203. //
  1204. // Multiple accesses to the same register number (in the same register class)
  1205. // only count as one access.
  1206. //
  1207. // ** When to call:
  1208. // Per instruction.
  1209. //
  1210. // ** Returns:
  1211. // Always TRUE.
  1212. //
  1213. //-----------------------------------------------------------------------------
  1214. BOOL CPShaderValidator14::Rule_ValidRegisterPortUsage()
  1215. {
  1216. UINT i, j;
  1217. UINT TempRegPortUsage[SHADER_INSTRUCTION_MAX_SRCPARAMS];
  1218. UINT InputRegPortUsage[SHADER_INSTRUCTION_MAX_SRCPARAMS];
  1219. UINT ConstRegPortUsage[SHADER_INSTRUCTION_MAX_SRCPARAMS];
  1220. UINT TextureRegPortUsage[SHADER_INSTRUCTION_MAX_SRCPARAMS];
  1221. UINT NumUniqueTempRegs = 0;
  1222. UINT NumUniqueInputRegs = 0;
  1223. UINT NumUniqueConstRegs = 0;
  1224. UINT NumUniqueTextureRegs = 0;
  1225. D3DSHADER_PARAM_REGISTER_TYPE RegType;
  1226. UINT RegNum;
  1227. static UINT s_TempRegPortUsageAcrossCoIssue[SHADER_INSTRUCTION_MAX_SRCPARAMS*2];
  1228. static UINT s_InputRegPortUsageAcrossCoIssue[SHADER_INSTRUCTION_MAX_SRCPARAMS*2];
  1229. static UINT s_ConstRegPortUsageAcrossCoIssue[SHADER_INSTRUCTION_MAX_SRCPARAMS*2];
  1230. static UINT s_TextureRegPortUsageAcrossCoIssue[SHADER_INSTRUCTION_MAX_SRCPARAMS*2];
  1231. static UINT s_NumUniqueTempRegsAcrossCoIssue;
  1232. static UINT s_NumUniqueInputRegsAcrossCoIssue;
  1233. static UINT s_NumUniqueConstRegsAcrossCoIssue;
  1234. static UINT s_NumUniqueTextureRegsAcrossCoIssue;
  1235. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  1236. {
  1237. s_NumUniqueTempRegsAcrossCoIssue = 0;
  1238. s_NumUniqueInputRegsAcrossCoIssue = 0;
  1239. s_NumUniqueConstRegsAcrossCoIssue = 0;
  1240. s_NumUniqueTextureRegsAcrossCoIssue = 0;
  1241. }
  1242. for( i = 0; i < m_pCurrInst->m_SrcParamCount; i++ )
  1243. {
  1244. UINT* pRegPortUsage = NULL;
  1245. UINT* pNumUniqueRegs = NULL;
  1246. RegType = m_pCurrInst->m_SrcParam[i].m_RegType;
  1247. RegNum = m_pCurrInst->m_SrcParam[i].m_RegNum;
  1248. switch( RegType )
  1249. {
  1250. case D3DSPR_TEMP:
  1251. pRegPortUsage = TempRegPortUsage;
  1252. pNumUniqueRegs = &NumUniqueTempRegs;
  1253. break;
  1254. case D3DSPR_INPUT:
  1255. pRegPortUsage = InputRegPortUsage;
  1256. pNumUniqueRegs = &NumUniqueInputRegs;
  1257. break;
  1258. case D3DSPR_CONST:
  1259. pRegPortUsage = ConstRegPortUsage;
  1260. pNumUniqueRegs = &NumUniqueConstRegs;
  1261. break;
  1262. case D3DSPR_TEXTURE:
  1263. pRegPortUsage = TextureRegPortUsage;
  1264. pNumUniqueRegs = &NumUniqueTextureRegs;
  1265. break;
  1266. }
  1267. if( !pRegPortUsage ) continue;
  1268. BOOL bRegAlreadyAccessed = FALSE;
  1269. for( j = 0; j < *pNumUniqueRegs; j++ )
  1270. {
  1271. if( pRegPortUsage[j] == RegNum )
  1272. {
  1273. bRegAlreadyAccessed = TRUE;
  1274. break;
  1275. }
  1276. }
  1277. if( !bRegAlreadyAccessed )
  1278. {
  1279. pRegPortUsage[*pNumUniqueRegs] = RegNum;
  1280. (*pNumUniqueRegs)++;
  1281. }
  1282. }
  1283. if( NumUniqueTempRegs > m_pTempRegFile->GetNumReadPorts() )
  1284. {
  1285. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%d different temp registers (r#) read by instruction. Max. different temp registers readable per instruction is %d.",
  1286. NumUniqueTempRegs, m_pTempRegFile->GetNumReadPorts());
  1287. m_ErrorCount++;
  1288. }
  1289. if( NumUniqueInputRegs > m_pInputRegFile->GetNumReadPorts() )
  1290. {
  1291. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%d different input registers (v#) read by instruction. Max. different input registers readable per instruction is %d.",
  1292. NumUniqueInputRegs, m_pInputRegFile->GetNumReadPorts());
  1293. m_ErrorCount++;
  1294. }
  1295. if( NumUniqueConstRegs > m_pConstRegFile->GetNumReadPorts() )
  1296. {
  1297. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%d different constant registers (c#) read by instruction. Max. different constant registers readable per instruction is %d.",
  1298. NumUniqueConstRegs, m_pConstRegFile->GetNumReadPorts());
  1299. m_ErrorCount++;
  1300. }
  1301. if( NumUniqueTextureRegs > m_pTextureRegFile->GetNumReadPorts() )
  1302. {
  1303. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "%d different texture coordinate registers (t#) read by instruction. Max. different texture registers readable per instruction is %d.",
  1304. NumUniqueTextureRegs, m_pTextureRegFile->GetNumReadPorts());
  1305. m_ErrorCount++;
  1306. }
  1307. // Read port limit for different register numbers of any one register type across co-issued instructions is MAX_READPORTS_ACROSS_COISSUE total.
  1308. if( _CURR_PS_INST->m_bCoIssue && _PREV_PS_INST && !(_PREV_PS_INST->m_bCoIssue)) // second 2 clauses are just a simple sanity check -> co-issue only involved 2 instructions.
  1309. {
  1310. for( i = 0; i < m_pCurrInst->m_SrcParamCount; i++ )
  1311. {
  1312. UINT* pRegPortUsageAcrossCoIssue = NULL;
  1313. UINT* pNumUniqueRegsAcrossCoIssue = NULL;
  1314. RegType = m_pCurrInst->m_SrcParam[i].m_RegType;
  1315. RegNum = m_pCurrInst->m_SrcParam[i].m_RegNum;
  1316. switch( RegType )
  1317. {
  1318. case D3DSPR_TEMP:
  1319. pRegPortUsageAcrossCoIssue = s_TempRegPortUsageAcrossCoIssue;
  1320. pNumUniqueRegsAcrossCoIssue = &s_NumUniqueTempRegsAcrossCoIssue;
  1321. break;
  1322. case D3DSPR_INPUT:
  1323. pRegPortUsageAcrossCoIssue = s_InputRegPortUsageAcrossCoIssue;
  1324. pNumUniqueRegsAcrossCoIssue = &s_NumUniqueInputRegsAcrossCoIssue;
  1325. break;
  1326. case D3DSPR_CONST:
  1327. pRegPortUsageAcrossCoIssue = s_ConstRegPortUsageAcrossCoIssue;
  1328. pNumUniqueRegsAcrossCoIssue = &s_NumUniqueConstRegsAcrossCoIssue;
  1329. break;
  1330. case D3DSPR_TEXTURE:
  1331. pRegPortUsageAcrossCoIssue = s_TextureRegPortUsageAcrossCoIssue;
  1332. pNumUniqueRegsAcrossCoIssue = &s_NumUniqueTextureRegsAcrossCoIssue;
  1333. break;
  1334. }
  1335. if( !pRegPortUsageAcrossCoIssue ) continue;
  1336. BOOL bRegAlreadyAccessed = FALSE;
  1337. for( j = 0; j < *pNumUniqueRegsAcrossCoIssue; j++ )
  1338. {
  1339. if( pRegPortUsageAcrossCoIssue[j] == RegNum )
  1340. {
  1341. bRegAlreadyAccessed = TRUE;
  1342. break;
  1343. }
  1344. }
  1345. if( !bRegAlreadyAccessed )
  1346. {
  1347. pRegPortUsageAcrossCoIssue[*pNumUniqueRegsAcrossCoIssue] = RegNum;
  1348. (*pNumUniqueRegsAcrossCoIssue)++;
  1349. }
  1350. }
  1351. #define MAX_READPORTS_ACROSS_COISSUE 3
  1352. if( s_NumUniqueTempRegsAcrossCoIssue > MAX_READPORTS_ACROSS_COISSUE )
  1353. {
  1354. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1355. "%d different temp registers (r#) read over 2 co-issued instructions. "\
  1356. "Max. different register numbers from any one register type readable across co-issued instructions is %d.",
  1357. s_NumUniqueTempRegsAcrossCoIssue, MAX_READPORTS_ACROSS_COISSUE);
  1358. m_ErrorCount++;
  1359. }
  1360. if( s_NumUniqueInputRegsAcrossCoIssue > MAX_READPORTS_ACROSS_COISSUE )
  1361. {
  1362. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1363. "%d different input registers (v#) read over 2 co-issued instructions. "\
  1364. "Max. different register numbers from any one register type readable across co-issued instructions is %d.",
  1365. s_NumUniqueInputRegsAcrossCoIssue, MAX_READPORTS_ACROSS_COISSUE);
  1366. m_ErrorCount++;
  1367. }
  1368. if( s_NumUniqueConstRegsAcrossCoIssue > MAX_READPORTS_ACROSS_COISSUE )
  1369. {
  1370. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1371. "%d different constant registers (c#) read over 2 co-issued instructions. "\
  1372. "Max. different register numbers from any one register type readable across co-issued instructions is %d.",
  1373. s_NumUniqueConstRegsAcrossCoIssue, MAX_READPORTS_ACROSS_COISSUE);
  1374. m_ErrorCount++;
  1375. }
  1376. if( s_NumUniqueTextureRegsAcrossCoIssue > MAX_READPORTS_ACROSS_COISSUE )
  1377. {
  1378. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1379. "%d different texture coordinate registers (t#) read over 2 co-issued instructions. "\
  1380. "Max. different register numbers from any one register type readable across co-issued instructions is %d.",
  1381. s_NumUniqueTextureRegsAcrossCoIssue, MAX_READPORTS_ACROSS_COISSUE);
  1382. m_ErrorCount++;
  1383. }
  1384. }
  1385. if( !_CURR_PS_INST->m_bCoIssue )
  1386. {
  1387. // Copy all state to static vars so that in case next instruction is co-issued with this one,
  1388. // cross-coissue read port limit of 3 can be enforced.
  1389. memcpy(&s_TempRegPortUsageAcrossCoIssue,&TempRegPortUsage,NumUniqueTempRegs*sizeof(UINT));
  1390. memcpy(&s_InputRegPortUsageAcrossCoIssue,&InputRegPortUsage,NumUniqueInputRegs*sizeof(UINT));
  1391. memcpy(&s_ConstRegPortUsageAcrossCoIssue,&ConstRegPortUsage,NumUniqueConstRegs*sizeof(UINT));
  1392. memcpy(&s_TextureRegPortUsageAcrossCoIssue,&TextureRegPortUsage,NumUniqueTextureRegs*sizeof(UINT));
  1393. s_NumUniqueTempRegsAcrossCoIssue = NumUniqueTempRegs;
  1394. s_NumUniqueInputRegsAcrossCoIssue = NumUniqueInputRegs;
  1395. s_NumUniqueConstRegsAcrossCoIssue = NumUniqueConstRegs;
  1396. s_NumUniqueTextureRegsAcrossCoIssue = NumUniqueTextureRegs;
  1397. }
  1398. else
  1399. {
  1400. // reset counts because the next instruction cannot be co-issued with this one.
  1401. s_NumUniqueTempRegsAcrossCoIssue = 0;
  1402. s_NumUniqueInputRegsAcrossCoIssue = 0;
  1403. s_NumUniqueConstRegsAcrossCoIssue = 0;
  1404. s_NumUniqueTextureRegsAcrossCoIssue = 0;
  1405. }
  1406. return TRUE;
  1407. }
  1408. //-----------------------------------------------------------------------------
  1409. // CPShaderValidator14::Rule_ValidTexOpStageAndRegisterUsage
  1410. //
  1411. // ** Rule:
  1412. //
  1413. // ** When to call:
  1414. // Per instruction.
  1415. //
  1416. // ** Returns:
  1417. // Always TRUE.
  1418. //
  1419. //-----------------------------------------------------------------------------
  1420. BOOL CPShaderValidator14::Rule_ValidTexOpStageAndRegisterUsage()
  1421. {
  1422. static DWORD s_RegUsed; // bitfield representing if a retister has been used as a destination in this block of tex ops.
  1423. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  1424. {
  1425. s_RegUsed = 0;
  1426. }
  1427. else if( D3DSIO_PHASE == m_pCurrInst->m_Type )
  1428. {
  1429. s_RegUsed = 0;
  1430. }
  1431. if( !_CURR_PS_INST->m_bTexOp )
  1432. return TRUE;
  1433. if( D3DSPR_TEMP != m_pCurrInst->m_DstParam.m_RegType )
  1434. return TRUE;
  1435. UINT RegNum = m_pCurrInst->m_DstParam.m_RegNum;
  1436. if( RegNum >= m_pTempRegFile->GetNumRegs() )
  1437. return TRUE; // error spewed elsewhere
  1438. if( s_RegUsed & (1<<RegNum) )
  1439. {
  1440. if( 1 == m_Phase )
  1441. {
  1442. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1443. "Register r%d (and thus texture stage %d) already used as a destination for a tex* instruction in this block of the shader. "\
  1444. "Second use of this register as a tex* destination is only available after the phase marker. ",
  1445. RegNum, RegNum );
  1446. }
  1447. else // 2 == m_Phase
  1448. {
  1449. if( m_bPhaseMarkerInShader )
  1450. {
  1451. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1452. "Register r%d (and thus texture stage %d) already used as a destination for a tex* instruction in this block of the shader. "\
  1453. "An r# register may be used as the destination for a tex* instruction at most once before the phase marker and once after. ",
  1454. RegNum, RegNum );
  1455. }
  1456. else // no phase marker present. Different spew to indicate
  1457. {
  1458. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1459. "Register r%d (and thus texture stage %d) already used as a destination for a tex* instruction in this block of the shader. "\
  1460. "To perform two tex* instructions with the same destination register, they must be separated by inserting a phase marker. ",
  1461. RegNum, RegNum );
  1462. }
  1463. }
  1464. m_ErrorCount++;
  1465. return TRUE;
  1466. }
  1467. s_RegUsed |= (1<<RegNum);
  1468. return TRUE;
  1469. }
  1470. //-----------------------------------------------------------------------------
  1471. // CPShaderValidator14::Rule_TexOpAfterArithmeticOp
  1472. //
  1473. // ** Rule:
  1474. // Tex ops (see IsTexOp() for which instructions are considered tex ops)
  1475. // must appear before any other instruction, with the exception of DEF or NOP.
  1476. //
  1477. // ** When to call:
  1478. // Per instruction.
  1479. //
  1480. // ** Returns:
  1481. // Always TRUE.
  1482. //
  1483. //-----------------------------------------------------------------------------
  1484. BOOL CPShaderValidator14::Rule_TexOpAfterArithmeticOp()
  1485. {
  1486. static BOOL s_bSeenArithmeticOp;
  1487. static BOOL s_bRuleDisabled;
  1488. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  1489. {
  1490. s_bSeenArithmeticOp = FALSE;
  1491. }
  1492. if( !(_CURR_PS_INST->m_bTexOp)
  1493. && (D3DSIO_NOP != m_pCurrInst->m_Type)
  1494. && (D3DSIO_DEF != m_pCurrInst->m_Type)
  1495. && (D3DSIO_PHASE != m_pCurrInst->m_Type) )
  1496. {
  1497. s_bSeenArithmeticOp = TRUE;
  1498. return TRUE;
  1499. }
  1500. if( D3DSIO_PHASE == m_pCurrInst->m_Type )
  1501. {
  1502. s_bSeenArithmeticOp = FALSE; // reset flag because we are in new phase of shader.
  1503. return TRUE;
  1504. }
  1505. if( _CURR_PS_INST->m_bTexOp && s_bSeenArithmeticOp )
  1506. {
  1507. if( m_bPhaseMarkerInShader )
  1508. {
  1509. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "tex* instructions cannot be after arithmetic instructions "\
  1510. "within one phase of the shader. Each phase can have a block of "\
  1511. "tex* instructions followed by a block of arithmetic instructions. " );
  1512. }
  1513. else
  1514. {
  1515. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "tex* instructions cannot be after arithmetic instructions. "\
  1516. "The exception is if a phase marker is present in the shader - "\
  1517. "this separates a shader into two phases. Each phase may have "\
  1518. "a set of tex* instructions followed by a set of arithmetic instructions. " );
  1519. }
  1520. m_ErrorCount++;
  1521. s_bRuleDisabled = TRUE;
  1522. }
  1523. return TRUE;
  1524. }
  1525. //-----------------------------------------------------------------------------
  1526. // CPShaderValidator14::Rule_ValidMarker
  1527. //
  1528. // ** Rule:
  1529. //
  1530. // ** When to call:
  1531. // Per instruction.
  1532. //
  1533. // ** Returns:
  1534. // FALSE if more than one marker encountered. Else TRUE
  1535. //
  1536. //-----------------------------------------------------------------------------
  1537. BOOL CPShaderValidator14::Rule_ValidMarker()
  1538. {
  1539. static BOOL s_bSeenMarker;
  1540. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  1541. {
  1542. s_bSeenMarker = FALSE;
  1543. }
  1544. if( D3DSIO_PHASE != m_pCurrInst->m_Type )
  1545. return TRUE;
  1546. if( s_bSeenMarker )
  1547. {
  1548. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Multiple phase markers not permitted. Aborting shader validation." );
  1549. m_ErrorCount++;
  1550. return FALSE;
  1551. }
  1552. s_bSeenMarker = TRUE;
  1553. m_pPhaseMarkerInst = (CPSInstruction*)m_pCurrInst;
  1554. m_Phase++;
  1555. // Loop through all temp registers and nuke alpha access history (if any).
  1556. // Remember what we nuked, so if the shader tries to read one of these nuked alphas, we
  1557. // can debug spew that certain hardware is wacko and can't help but commit this atrocity.
  1558. for( UINT i = 0; i < m_pTempRegFile->GetNumRegs(); i++ )
  1559. {
  1560. if( m_pTempRegFile->m_pAccessHistory[3][i].m_pMostRecentWriter )
  1561. {
  1562. m_pTempRegFile->m_pAccessHistory[3][i].~CAccessHistory();
  1563. m_pTempRegFile->m_pAccessHistory[3][i].CAccessHistory::CAccessHistory();
  1564. m_TempRegsWithZappedAlpha |= 1 << i;
  1565. }
  1566. }
  1567. return TRUE;
  1568. }
  1569. //-----------------------------------------------------------------------------
  1570. // CPShaderValidator14::Rule_ValidTEXKILLInstruction
  1571. //
  1572. // ** Rule:
  1573. // texkill may only be present in phase 2
  1574. //
  1575. // ** When to call:
  1576. // Per instruction.
  1577. //
  1578. // ** Returns:
  1579. // Always TRUE.
  1580. //
  1581. //-----------------------------------------------------------------------------
  1582. BOOL CPShaderValidator14::Rule_ValidTEXKILLInstruction()
  1583. {
  1584. if( (D3DSIO_TEXKILL == m_pCurrInst->m_Type) && (1 == m_Phase))
  1585. {
  1586. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "When a phase marker is present in a shader, texkill is only permitted after the phase marker." );
  1587. m_ErrorCount++;
  1588. }
  1589. return TRUE;
  1590. }
  1591. //-----------------------------------------------------------------------------
  1592. // CPShaderValidator14::Rule_ValidBEMInstruction
  1593. //
  1594. // ** Rule:
  1595. // bem must have writemask .r, .g or .rg
  1596. // bem may only be present once in a shader, in phase 1.
  1597. //
  1598. // ** When to call:
  1599. // Per instruction.
  1600. //
  1601. // ** Returns:
  1602. // Always TRUE.
  1603. //
  1604. //-----------------------------------------------------------------------------
  1605. BOOL CPShaderValidator14::Rule_ValidBEMInstruction()
  1606. {
  1607. static BOOL s_bSeenBem;
  1608. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  1609. {
  1610. s_bSeenBem = FALSE;
  1611. }
  1612. if( (D3DSIO_BEM == m_pCurrInst->m_Type))
  1613. {
  1614. if( s_bSeenBem )
  1615. {
  1616. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "bem may only be used once in a shader." );
  1617. m_ErrorCount++;
  1618. }
  1619. if( 2 == m_Phase )
  1620. {
  1621. if( m_bPhaseMarkerInShader )
  1622. {
  1623. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "bem may only be used before the phase marker." );
  1624. }
  1625. else
  1626. {
  1627. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "To use bem, a phase marker must be present later in the shader." );
  1628. }
  1629. m_ErrorCount++;
  1630. }
  1631. if( m_pCurrInst->m_DstParam.m_WriteMask != (D3DSP_WRITEMASK_0 | D3DSP_WRITEMASK_1))
  1632. {
  1633. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Writemask for bem must be '.rg'" );
  1634. m_ErrorCount++;
  1635. }
  1636. for( UINT i = 0; i < m_pCurrInst->m_SrcParamCount; i++ )
  1637. {
  1638. SRCPARAM* pSrcParam = &(m_pCurrInst->m_SrcParam[i]);
  1639. if(m_bSrcParamError[i])
  1640. continue;
  1641. if( 0 == i )
  1642. {
  1643. if( (D3DSPR_TEMP != pSrcParam->m_RegType) &&
  1644. (D3DSPR_CONST != pSrcParam->m_RegType) )
  1645. {
  1646. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "First source parameter for bem must be temp (r#) or constant (c#) register." );
  1647. m_ErrorCount++;
  1648. }
  1649. }
  1650. else if( 1 == i )
  1651. {
  1652. if( (D3DSPR_TEMP != pSrcParam->m_RegType ) )
  1653. {
  1654. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Second source parameter for bem must be temp (r#) register." );
  1655. m_ErrorCount++;
  1656. }
  1657. }
  1658. }
  1659. }
  1660. return TRUE;
  1661. }
  1662. //-----------------------------------------------------------------------------
  1663. // CPShaderValidator14::Rule_ValidTEXDEPTHInstruction
  1664. //
  1665. // ** Rule:
  1666. // texdepth must operate on r5.
  1667. // texdepth may only be present after a phase marker.
  1668. // texdepth may only be used once.
  1669. // Once texdepth has been used in a shader, r5 is no longer available
  1670. //
  1671. // ** When to call:
  1672. // Per instruction.
  1673. //
  1674. // ** Returns:
  1675. // Always TRUE.
  1676. //
  1677. //-----------------------------------------------------------------------------
  1678. BOOL CPShaderValidator14::Rule_ValidTEXDEPTHInstruction()
  1679. {
  1680. static BOOL s_bSeenTexDepth;
  1681. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  1682. {
  1683. s_bSeenTexDepth = FALSE;
  1684. }
  1685. if( D3DSIO_TEXDEPTH == m_pCurrInst->m_Type )
  1686. {
  1687. if( s_bSeenTexDepth )
  1688. {
  1689. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Only one use of texdepth is permitted." );
  1690. m_ErrorCount++;
  1691. return TRUE;
  1692. }
  1693. s_bSeenTexDepth = TRUE;
  1694. DSTPARAM* pDstParam = &m_pCurrInst->m_DstParam;
  1695. if( (5 != pDstParam->m_RegNum) || (D3DSPR_TEMP != pDstParam->m_RegType) )
  1696. {
  1697. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Destination for texdepth must be r5." );
  1698. m_ErrorCount++;
  1699. }
  1700. if( (D3DSIO_TEXDEPTH == m_pCurrInst->m_Type) && (1 == m_Phase))
  1701. {
  1702. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "When a phase marker is present in a shader, texdepth is only permitted after the phase marker." );
  1703. m_ErrorCount++;
  1704. }
  1705. }
  1706. else if( s_bSeenTexDepth )
  1707. {
  1708. UINT RegNum;
  1709. D3DSHADER_PARAM_REGISTER_TYPE RegType;
  1710. for( UINT i = 0; i <= m_pCurrInst->m_SrcParamCount; i++ )
  1711. {
  1712. if( m_pCurrInst->m_SrcParamCount == i )
  1713. {
  1714. RegNum = m_pCurrInst->m_DstParam.m_RegNum;
  1715. RegType = m_pCurrInst->m_DstParam.m_RegType;
  1716. }
  1717. else
  1718. {
  1719. RegNum = m_pCurrInst->m_SrcParam[i].m_RegNum;
  1720. RegType = m_pCurrInst->m_SrcParam[i].m_RegType;
  1721. }
  1722. if( (5 == RegNum) && (D3DSPR_TEMP == RegType) )
  1723. {
  1724. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "After texdepth instruction, r5 is no longer available in shader." );
  1725. m_ErrorCount++;
  1726. return TRUE;
  1727. }
  1728. }
  1729. }
  1730. return TRUE;
  1731. }
  1732. //-----------------------------------------------------------------------------
  1733. // CPShaderValidator14::Rule_ValidDEFInstruction
  1734. //
  1735. // ** Rule:
  1736. // For the DEF instruction, make sure the dest parameter is a valid constant,
  1737. // and it has no modifiers.
  1738. //
  1739. // NOTE that we are pretending this instruction only has a dst parameter.
  1740. // We skipped over the 4 source parameters since they are immediate floats,
  1741. // for which there is nothing that can be checked.
  1742. //
  1743. // ** When to call:
  1744. // Per instruction.
  1745. //
  1746. // ** Returns:
  1747. // Always TRUE.
  1748. //
  1749. //-----------------------------------------------------------------------------
  1750. BOOL CPShaderValidator14::Rule_ValidDEFInstruction()
  1751. {
  1752. static BOOL s_bDEFInstructionAllowed;
  1753. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  1754. {
  1755. s_bDEFInstructionAllowed = TRUE;
  1756. }
  1757. if( D3DSIO_COMMENT != m_pCurrInst->m_Type &&
  1758. D3DSIO_DEF != m_pCurrInst->m_Type )
  1759. {
  1760. s_bDEFInstructionAllowed = FALSE;
  1761. }
  1762. else if( D3DSIO_DEF == m_pCurrInst->m_Type )
  1763. {
  1764. if( !s_bDEFInstructionAllowed )
  1765. {
  1766. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Const declaration (def) must appear before other instructions." );
  1767. m_ErrorCount++;
  1768. }
  1769. DSTPARAM* pDstParam = &m_pCurrInst->m_DstParam;
  1770. if( D3DSP_WRITEMASK_ALL != pDstParam->m_WriteMask ||
  1771. D3DSPDM_NONE != pDstParam->m_DstMod ||
  1772. DSTSHIFT_NONE != pDstParam->m_DstShift ||
  1773. D3DSPR_CONST != pDstParam->m_RegType
  1774. )
  1775. {
  1776. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Destination for def instruction must be of the form c# (# = reg number, no modifiers)." );
  1777. m_ErrorCount++;
  1778. }
  1779. // Check that the register number is in bounds
  1780. if( D3DSPR_CONST == pDstParam->m_RegType &&
  1781. pDstParam->m_RegNum >= m_pConstRegFile->GetNumRegs() )
  1782. {
  1783. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Invalid const register num: %d. Max allowed is %d.",
  1784. pDstParam->m_RegNum,m_pConstRegFile->GetNumRegs() - 1);
  1785. m_ErrorCount++;
  1786. }
  1787. }
  1788. return TRUE;
  1789. }
  1790. //-----------------------------------------------------------------------------
  1791. // CPShaderValidator14::Rule_ValidInstructionPairing
  1792. //
  1793. // ** Rule:
  1794. // - If an instruction is co-issued with another instruction,
  1795. // make sure that both do not write to any of RGB at the same time,
  1796. // and that neither instruction individually writes to all of RGBA.
  1797. //
  1798. // - Co-issue can only involve 2 instructions,
  1799. // so consecutive instructions cannot have the "+" prefix (D3DSI_COISSUE).
  1800. //
  1801. // - Co-issue of instructions only applies to pixel blend instructions (non tex-ops).
  1802. //
  1803. // - The first color blend instruction cannot have "+" (D3DSI_COISSUE) set either.
  1804. //
  1805. // - NOP may not be used in a co-issue pair.
  1806. //
  1807. // - DP3 (dot product) always uses the color/vector pipeline (even if it is not writing
  1808. // to color components). Thus:
  1809. // - An instruction co-issued with a dot-product can only write to alpha.
  1810. // - A dot-product that writes to alpha cannot be co-issued.
  1811. // - Two dot-products cannot be co-issued.
  1812. //
  1813. // - For version <= 1.0, coissued instructions must write to the same register.
  1814. //
  1815. // ------------------
  1816. // examples:
  1817. //
  1818. // valid pair: mov r0.a, c0
  1819. // +add r1.rgb, v1, c1 (note dst reg #'s can be different)
  1820. //
  1821. // another valid pair: mov r0.a, c0
  1822. // +add r0.rgb, v1, c1
  1823. //
  1824. // another valid pair: dp3 r0.rgb, t1, v1
  1825. // +mul r0.a, t0, v0
  1826. //
  1827. // another valid pair: mov r0.a, c0
  1828. // +add r0.a, t0, t1
  1829. //
  1830. // invalid pair: mov r0.rgb, c0
  1831. // +add r0, t0, t1 (note the dst writes to rgba)
  1832. //
  1833. // another invalid pair: mov r1.rgb, c1
  1834. // +dp3 r0.a, t0, t1 (dp3 is using up color/vector pipe)
  1835. //
  1836. // ** When to call:
  1837. // Per instruction.
  1838. //
  1839. // ** Returns:
  1840. // Always TRUE.
  1841. //
  1842. //-----------------------------------------------------------------------------
  1843. BOOL CPShaderValidator14::Rule_ValidInstructionPairing()
  1844. {
  1845. static BOOL s_bSeenArithOp;
  1846. BOOL bCurrInstCoIssuable = TRUE;
  1847. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  1848. {
  1849. s_bSeenArithOp = FALSE;
  1850. }
  1851. if( !_CURR_PS_INST->m_bTexOp )
  1852. {
  1853. switch( m_pCurrInst->m_Type )
  1854. {
  1855. case D3DSIO_PHASE:
  1856. case D3DSIO_DEF:
  1857. case D3DSIO_NOP:
  1858. case D3DSIO_DP4:
  1859. bCurrInstCoIssuable = FALSE;
  1860. break;
  1861. }
  1862. }
  1863. if( D3DSIO_PHASE == m_pCurrInst->m_Type )
  1864. {
  1865. s_bSeenArithOp = FALSE;
  1866. }
  1867. else if( bCurrInstCoIssuable )
  1868. {
  1869. s_bSeenArithOp = TRUE;
  1870. }
  1871. if( !_CURR_PS_INST->m_bCoIssue )
  1872. return TRUE;
  1873. if( _CURR_PS_INST->m_bTexOp )
  1874. {
  1875. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1876. "Cannot set co-issue ('+') on a tex* instruction. Co-issue only applies to arithmetic instructions." );
  1877. m_ErrorCount++;
  1878. return TRUE;
  1879. }
  1880. if( !s_bSeenArithOp || NULL == m_pCurrInst->m_pPrevInst )
  1881. {
  1882. if( D3DSIO_PHASE == m_pCurrInst->m_Type )
  1883. {
  1884. // cannot have co-issue set because we haven't seen an arithmetic op above.
  1885. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1886. "Phase marker cannot be co-issued.");
  1887. }
  1888. else
  1889. {
  1890. // cannot have co-issue set because we haven't seen an arithmetic op above.
  1891. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1892. "Instruction cannot have co-issue ('+') set without a previous arithmetic instruction to pair with.");
  1893. }
  1894. m_ErrorCount++;
  1895. return TRUE;
  1896. }
  1897. if( _PREV_PS_INST->m_bCoIssue )
  1898. {
  1899. // consecutive instructions cannot have co-issue set.
  1900. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst, "Cannot set co-issue ('+') on consecutive instructions." );
  1901. m_ErrorCount++;
  1902. return TRUE;
  1903. }
  1904. for( UINT i = 0; i < 2; i++ )
  1905. {
  1906. CBaseInstruction* pInst;
  1907. if( 0 == i )
  1908. pInst = m_pCurrInst;
  1909. else
  1910. pInst = m_pCurrInst->m_pPrevInst;
  1911. switch( pInst->m_Type )
  1912. {
  1913. case D3DSIO_PHASE:
  1914. // Phase marker cannot be co-issued
  1915. Spew( SPEW_INSTRUCTION_ERROR, pInst, "phase marker cannot be co-issued." );
  1916. m_ErrorCount++;
  1917. return TRUE;
  1918. case D3DSIO_DEF:
  1919. // DEF cannot be co-issued
  1920. Spew( SPEW_INSTRUCTION_ERROR, pInst, "def cannot be co-issued." );
  1921. m_ErrorCount++;
  1922. return TRUE;
  1923. case D3DSIO_NOP:
  1924. // NOP cannot be co-issued
  1925. Spew( SPEW_INSTRUCTION_ERROR, pInst, "nop cannot be co-issued." );
  1926. m_ErrorCount++;
  1927. return TRUE;
  1928. case D3DSIO_DP4:
  1929. // DP4 cannot be co-issued
  1930. Spew( SPEW_INSTRUCTION_ERROR, pInst, "dp4 cannot be co-issued." );
  1931. m_ErrorCount++;
  1932. return TRUE;
  1933. case D3DSIO_BEM:
  1934. // BEM cannot be co-issued
  1935. Spew( SPEW_INSTRUCTION_ERROR, pInst, "bem cannot be co-issued." );
  1936. m_ErrorCount++;
  1937. return TRUE;
  1938. }
  1939. }
  1940. #define COLOR_WRITE_MASK (D3DSP_WRITEMASK_0 | D3DSP_WRITEMASK_1 | D3DSP_WRITEMASK_2)
  1941. #define ALPHA_WRITE_MASK D3DSP_WRITEMASK_3
  1942. DWORD CurrInstWriteMask = 0;
  1943. DWORD PrevInstWriteMask = 0;
  1944. if( m_pCurrInst->m_DstParam.m_bParamUsed )
  1945. CurrInstWriteMask = m_pCurrInst->m_DstParam.m_WriteMask;
  1946. if( m_pCurrInst->m_pPrevInst->m_DstParam.m_bParamUsed )
  1947. PrevInstWriteMask = m_pCurrInst->m_pPrevInst->m_DstParam.m_WriteMask;
  1948. if( D3DSIO_DP3 == m_pCurrInst->m_Type &&
  1949. D3DSIO_DP3 == m_pCurrInst->m_pPrevInst->m_Type )
  1950. {
  1951. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1952. "Co-issued instructions cannot both be dp3, since each require use of the color pipe to execute." );
  1953. m_ErrorCount++;
  1954. }
  1955. else if( D3DSIO_DP3 == m_pCurrInst->m_Type )
  1956. {
  1957. if( COLOR_WRITE_MASK & PrevInstWriteMask )
  1958. {
  1959. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst->m_pPrevInst,
  1960. "dp3 needs color pipe to execute, so instruction co-issued with it cannot write to color components." );
  1961. m_ErrorCount++;
  1962. }
  1963. if( D3DSP_WRITEMASK_3 & CurrInstWriteMask ) // alpha in addition to the implied rgb for dp3
  1964. {
  1965. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1966. "dp3 which writes alpha cannot co-issue since it uses up both the alpha and color pipes." );
  1967. m_ErrorCount++;
  1968. }
  1969. }
  1970. else if( D3DSIO_DP3 == m_pCurrInst->m_pPrevInst->m_Type )
  1971. {
  1972. if( COLOR_WRITE_MASK & CurrInstWriteMask )
  1973. {
  1974. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst->m_pPrevInst,
  1975. "dp3 needs color pipe to execute, so instruction co-issued with it cannot write to color components." );
  1976. m_ErrorCount++;
  1977. }
  1978. if( D3DSP_WRITEMASK_3 & PrevInstWriteMask ) // alpha in addition to the implied rgb for dp3
  1979. {
  1980. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst->m_pPrevInst,
  1981. "dp3 which writes alpha cannot co-issue since it uses up both the alpha and color pipes." );
  1982. m_ErrorCount++;
  1983. }
  1984. }
  1985. if( (PrevInstWriteMask & ALPHA_WRITE_MASK) && (PrevInstWriteMask & COLOR_WRITE_MASK))
  1986. {
  1987. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst->m_pPrevInst,
  1988. "Individual instruction in co-issue pair cannot write both alpha and color component(s)." );
  1989. m_ErrorCount++;
  1990. }
  1991. if( (CurrInstWriteMask & ALPHA_WRITE_MASK) && (CurrInstWriteMask & COLOR_WRITE_MASK))
  1992. {
  1993. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  1994. "Individual instruction in co-issue pair cannot write both alpha and color component(s)." );
  1995. m_ErrorCount++;
  1996. }
  1997. if( CurrInstWriteMask & PrevInstWriteMask )
  1998. {
  1999. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  2000. "Co-issued instructions cannot both write to the same component(s). One instruction must write to alpha and the other may write to any combination of red/green/blue. Destination registers may differ." );
  2001. m_ErrorCount++;
  2002. }
  2003. if( !((CurrInstWriteMask | PrevInstWriteMask) & ALPHA_WRITE_MASK) )
  2004. {
  2005. Spew( SPEW_INSTRUCTION_ERROR, m_pCurrInst,
  2006. "One of the instructions in a co-issue pair must write to alpha only (.a writemask)." );
  2007. m_ErrorCount++;
  2008. }
  2009. return TRUE;
  2010. }
  2011. //-----------------------------------------------------------------------------
  2012. // CPShaderValidator14::Rule_ValidInstructionCount
  2013. //
  2014. // ** Rule:
  2015. // Make sure instruction count for pixel shader version has not been exceeded.
  2016. //
  2017. // Co-issued pixel blending instructions only
  2018. // count as one instruction towards the limit.
  2019. //
  2020. // The def instruction, nop, and comments (already stripped), do not count
  2021. // toward any limits.
  2022. //
  2023. // ** When to call:
  2024. // Per instruction AND after all instructions seen.
  2025. //
  2026. // ** Returns:
  2027. // Always TRUE.
  2028. //
  2029. //-----------------------------------------------------------------------------
  2030. BOOL CPShaderValidator14::Rule_ValidInstructionCount()
  2031. {
  2032. static UINT s_MaxTexOpCount;
  2033. static UINT s_MaxArithmeticOpCount;
  2034. if( NULL == m_pCurrInst )
  2035. return TRUE;
  2036. if( NULL == m_pCurrInst->m_pPrevInst ) // First instruction - initialize static vars
  2037. {
  2038. m_TexOpCount = 0;
  2039. m_BlendOpCount = 0;
  2040. m_TotalOpCount = 0;
  2041. switch(m_Version)
  2042. {
  2043. default:
  2044. case D3DPS_VERSION(1,4): // DX8.1
  2045. s_MaxTexOpCount = 6;
  2046. s_MaxArithmeticOpCount = 8;
  2047. break;
  2048. }
  2049. }
  2050. if( m_bSeenAllInstructions || D3DSIO_PHASE == m_pCurrInst->m_Type )
  2051. {
  2052. if( m_pCurrInst && (D3DSIO_PHASE == m_pCurrInst->m_Type) )
  2053. {
  2054. if( m_TexOpCount > s_MaxTexOpCount )
  2055. {
  2056. Spew( SPEW_GLOBAL_ERROR, NULL, "Too many (%d) tex* instructions before phase marker. Max. allowed in a phase is %d.",
  2057. m_TexOpCount, s_MaxTexOpCount);
  2058. m_ErrorCount++;
  2059. }
  2060. if( m_BlendOpCount > s_MaxArithmeticOpCount )
  2061. {
  2062. Spew( SPEW_GLOBAL_ERROR, NULL, "Too many (%d) arithmetic instructions before phase marker. Max. allowed in a phase (counting any co-issued pairs as 1) is %d.",
  2063. m_BlendOpCount, s_MaxArithmeticOpCount);
  2064. m_ErrorCount++;
  2065. }
  2066. }
  2067. else // 2 == m_Phase
  2068. {
  2069. if( m_bPhaseMarkerInShader )
  2070. {
  2071. if( m_TexOpCount > s_MaxTexOpCount )
  2072. {
  2073. Spew( SPEW_GLOBAL_ERROR, NULL, "Too many (%d) tex* instructions after phase marker. Max. allowed in a phase is %d.",
  2074. m_TexOpCount, s_MaxTexOpCount);
  2075. m_ErrorCount++;
  2076. }
  2077. if( m_BlendOpCount > s_MaxArithmeticOpCount )
  2078. {
  2079. Spew( SPEW_GLOBAL_ERROR, NULL, "Too many (%d) arithmetic instructions after phase marker. Max. allowed in a phase (counting any co-issued pairs as 1) is %d.",
  2080. m_BlendOpCount, s_MaxArithmeticOpCount);
  2081. m_ErrorCount++;
  2082. }
  2083. }
  2084. else // defaulted to phase 2 because no phase marker was in shader
  2085. {
  2086. if( m_TexOpCount > s_MaxTexOpCount )
  2087. {
  2088. Spew( SPEW_GLOBAL_ERROR, NULL, "Too many (%d) tex* instructions. Max. allowed is %d. Note that adding a phase marker to the shader would double the number of instructions available.",
  2089. m_TexOpCount, s_MaxTexOpCount);
  2090. m_ErrorCount++;
  2091. }
  2092. if( m_BlendOpCount > s_MaxArithmeticOpCount )
  2093. {
  2094. Spew( SPEW_GLOBAL_ERROR, NULL, "Too many (%d) arithmetic instructions. Max. allowed (counting any co-issued pairs as 1) is %d. Note that adding a phase marker to the shader would double the number of instructions available.",
  2095. m_BlendOpCount, s_MaxArithmeticOpCount);
  2096. m_ErrorCount++;
  2097. }
  2098. }
  2099. }
  2100. if( m_pCurrInst && D3DSIO_PHASE == m_pCurrInst->m_Type )
  2101. {
  2102. // reset counters for next phase.
  2103. m_TexOpCount = 0;
  2104. m_BlendOpCount = 0;
  2105. m_TotalOpCount = 0;
  2106. }
  2107. return TRUE;
  2108. }
  2109. switch(m_pCurrInst->m_Type)
  2110. {
  2111. case D3DSIO_TEX:
  2112. case D3DSIO_TEXCOORD:
  2113. case D3DSIO_TEXKILL:
  2114. case D3DSIO_TEXDEPTH:
  2115. m_TexOpCount++;
  2116. m_TotalOpCount++;
  2117. break;
  2118. case D3DSIO_MOV:
  2119. case D3DSIO_ADD:
  2120. case D3DSIO_SUB:
  2121. case D3DSIO_MUL:
  2122. case D3DSIO_MAD:
  2123. case D3DSIO_LRP:
  2124. case D3DSIO_DP3:
  2125. case D3DSIO_CND:
  2126. case D3DSIO_CMP:
  2127. case D3DSIO_DP4:
  2128. if( !_CURR_PS_INST->m_bCoIssue )
  2129. {
  2130. m_BlendOpCount++;
  2131. m_TotalOpCount++;
  2132. }
  2133. break;
  2134. case D3DSIO_BEM:
  2135. m_BlendOpCount+=2;
  2136. m_TotalOpCount+=2;
  2137. break;
  2138. case D3DSIO_END:
  2139. case D3DSIO_NOP:
  2140. case D3DSIO_DEF:
  2141. break;
  2142. default:
  2143. DXGASSERT(FALSE);
  2144. }
  2145. return TRUE;
  2146. }
  2147. //-----------------------------------------------------------------------------
  2148. // CPShaderValidator14::Rule_R0Written
  2149. //
  2150. // ** Rule:
  2151. // All components (r,g,b,a) of register R0 must have been written by the
  2152. // pixel shader.
  2153. //
  2154. // ** When to call:
  2155. // After all instructions have been seen.
  2156. //
  2157. // ** Returns:
  2158. // Always TRUE.
  2159. //
  2160. //-----------------------------------------------------------------------------
  2161. BOOL CPShaderValidator14::Rule_R0Written()
  2162. {
  2163. UINT NumUninitializedComponents = 0;
  2164. DWORD UninitializedComponentsMask = 0;
  2165. for( UINT i = 0; i < NUM_COMPONENTS_IN_REGISTER; i++ )
  2166. {
  2167. if( NULL == m_pTempRegFile->m_pAccessHistory[i][0].m_pMostRecentWriter )
  2168. {
  2169. NumUninitializedComponents++;
  2170. UninitializedComponentsMask |= COMPONENT_MASKS[i];
  2171. }
  2172. }
  2173. if( NumUninitializedComponents )
  2174. {
  2175. if( (UninitializedComponentsMask & COMPONENT_MASKS[3]) &&
  2176. (m_TempRegsWithZappedAlpha & (1 << 0 /*regnum=0*/ ) ) &&
  2177. (UninitializedComponentsMask & COMPONENT_MASKS[2]) &&
  2178. (m_TempRegsWithZappedBlue & (1 << 0 /*regnum=0*/ ) ) )
  2179. {
  2180. Spew( SPEW_GLOBAL_ERROR, NULL, "r0 must be written by shader. Uninitialized component%s(*): %s. "\
  2181. ZAPPED_BLUE_TEXT2 " Also: " ZAPPED_ALPHA_TEXT2,
  2182. NumUninitializedComponents > 1 ? "s" : "", MakeAffectedComponentsText(UninitializedComponentsMask,TRUE,FALSE));
  2183. }
  2184. else if( (UninitializedComponentsMask & COMPONENT_MASKS[3]) &&
  2185. (m_TempRegsWithZappedAlpha & (1 << 0 /*regnum=0*/ ) ) )
  2186. {
  2187. Spew( SPEW_GLOBAL_ERROR, NULL, "r0 must be written by shader. Uninitialized component%s(*): %s. "\
  2188. ZAPPED_ALPHA_TEXT2,
  2189. NumUninitializedComponents > 1 ? "s" : "", MakeAffectedComponentsText(UninitializedComponentsMask,TRUE,FALSE));
  2190. }
  2191. else if( (UninitializedComponentsMask & COMPONENT_MASKS[2]) &&
  2192. (m_TempRegsWithZappedBlue & (1 << 0 /*regnum=0*/ ) ) )
  2193. {
  2194. Spew( SPEW_GLOBAL_ERROR, NULL, "r0 must be written by shader. Uninitialized component%s(*): %s. "\
  2195. ZAPPED_BLUE_TEXT2,
  2196. NumUninitializedComponents > 1 ? "s" : "", MakeAffectedComponentsText(UninitializedComponentsMask,TRUE,FALSE));
  2197. }
  2198. else
  2199. {
  2200. Spew( SPEW_GLOBAL_ERROR, NULL, "r0 must be written by shader. Uninitialized component%s(*): %s",
  2201. NumUninitializedComponents > 1 ? "s" : "", MakeAffectedComponentsText(UninitializedComponentsMask,TRUE,FALSE));
  2202. }
  2203. m_ErrorCount++;
  2204. }
  2205. return TRUE;
  2206. }