//========= Copyright Valve Corporation, All rights reserved. ============//
// TOGL CODE LICENSE
//
// Copyright 2011-2014 Valve Corporation
// All Rights Reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.
//------------------------------------------------------------------------------
// DX9AsmToGL2.cpp
//------------------------------------------------------------------------------
// Immediately include gl.h, etc. here to avoid compilation warnings.
# include <GL/gl.h>
# include <GL/glext.h>
# include "togles/rendermechanism.h"
# include "tier0/dbg.h"
# include "tier1/strtools.h"
# include "tier1/utlbuffer.h"
# include "dx9asmtogl2.h"
# include "materialsystem/IShader.h"
// memdbgon must be the last include file in a .cpp file!!!
# include "tier0/memdbgon.h"
# ifdef POSIX
# define strcat_s( a, b, c) V_strcat( a, c, b )
# endif
# define DST_REGISTER 0
# define SRC_REGISTER 1
// Flags to PrintUsageAndIndexToString.
# define SEMANTIC_OUTPUT 0x01
# define SEMANTIC_INPUT 0x02
# define UNDECLARED_OUTPUT 0xFFFFFFFF
# define UNDECLARED_INPUT 0xFFFFFFFF
# ifndef POSIX
# define Debugger() Assert(0)
# endif
//#define Assert(n) if( !(n) ){ TranslationError(); }
static char g_szShadow2D [ ] =
" uniform sampler2D u_ShadowMap; \n "
" #define invSize 0.001953125 \n "
" #define size 512.0 \n "
" vec4 _shadow2D( sampler2D u_depthTex, vec3 suv) \n "
" { \n "
" vec2 p1 = suv.xy; \n "
" vec2 p2 = suv.xy+vec2(0.0,invSize); \n "
" vec2 p3 = suv.xy+vec2(invSize,0.0); \n "
" vec2 p4 = suv.xy+vec2(invSize); \n "
" float d = texture(u_depthTex,p1).r; \n "
" float r = float(d>suv.z); \n "
" d = texture(u_depthTex,p2).r; \n "
" float r2 = float(d>suv.z); \n "
" d = texture(u_depthTex,p3).r; \n "
" float r3 = float(d>suv.z); \n "
" d = texture(u_depthTex,p4).r; \n "
" float r4 = float(d>suv.z); \n "
" p1*=size; \n "
" float a = p1.y-floor(p1.y); \n "
" float b = p1.x-floor(p1.x); \n "
" float gg = mix(mix(r,r2,a),mix(r3,r4,a),b); \n "
" return vec4(gg, gg, gg, gg); "
" } \n "
" #define shadow2D _shadow2D \n " ;
static char g_szShadow2DProj [ ] =
" float _shadow2DProj( vec4 projection, vec2 texel, float NdotL ) \n "
" { \n "
" vec3 coord = vec3( projection.xyz / ( projection.w + 0.0005 )); // z-bias \n "
" coord.s = float( clamp( float( coord.s ), texel.x, 1.0 - texel.x )); \n "
" coord.t = float( clamp( float( coord.t ), texel.y, 1.0 - texel.y )); \n "
" coord.r = float( clamp( float( coord.r ), 0.0, 1.0 )); \n "
" return _shadow2D( u_ShadowMap, coord ); \n "
" } \n "
" #define shadow2DProj _shadow2DProj \n " ;
static char * g_szVecZeros [ ] = { NULL , " 0.0 " , " vec2( 0.0, 0.0 ) " , " vec3( 0.0, 0.0, 0.0 ) " , " vec4( 0.0, 0.0, 0.0, 0.0 ) " } ;
static char * g_szVecOnes [ ] = { NULL , " 1.0 " , " vec2( 1.0, 1.0 ) " , " vec3( 1.0, 1.0, 1.0 ) " , " vec4( 1.0, 1.0, 1.0, 1.0 ) " } ;
static char * g_szDefaultSwizzle = " xyzw " ;
static char * g_szDefaultSwizzleStrings [ ] = { " x " , " y " , " z " , " w " } ;
static char * g_szSamplerStrings [ ] = { " 2D " , " CUBE " , " 3D " } ;
static const char * g_pAtomicTempVarName = " atomic_temp_var " ;
static const char * g_pTangentAttributeName = " g_tangent " ;
int __cdecl SortInts ( const int * a , const int * b )
{
if ( * a < * b )
return - 1 ;
else if ( * a > * b )
return 1 ;
else
return 0 ;
}
void StripExtraTrailingZeros ( char * pStr )
{
int len = ( int ) V_strlen ( pStr ) ;
while ( len > = 2 & & pStr [ len - 1 ] = = ' 0 ' & & pStr [ len - 2 ] ! = ' . ' )
{
pStr [ len - 1 ] = 0 ;
- - len ;
}
}
void D3DToGL : : PrintToBufWithIndents ( CUtlBuffer & buf , const char * pFormat , . . . )
{
va_list marker ;
va_start ( marker , pFormat ) ;
char szTemp [ 1024 ] ;
V_vsnprintf ( szTemp , sizeof ( szTemp ) , pFormat , marker ) ;
va_end ( marker ) ;
PrintIndentation ( ( char * ) buf . Base ( ) , buf . Size ( ) ) ;
strcat_s ( ( char * ) buf . Base ( ) , buf . Size ( ) , szTemp ) ;
}
void PrintToBuf ( CUtlBuffer & buf , const char * pFormat , . . . )
{
va_list marker ;
va_start ( marker , pFormat ) ;
char szTemp [ 1024 ] ;
V_vsnprintf ( szTemp , sizeof ( szTemp ) , pFormat , marker ) ;
va_end ( marker ) ;
strcat_s ( ( char * ) buf . Base ( ) , buf . Size ( ) , szTemp ) ;
}
void PrintToBuf ( char * pOut , int nOutSize , const char * pFormat , . . . )
{
int nStrlen = V_strlen ( pOut ) ;
pOut + = nStrlen ;
nOutSize - = nStrlen ;
va_list marker ;
va_start ( marker , pFormat ) ;
V_vsnprintf ( pOut , nOutSize , pFormat , marker ) ;
va_end ( marker ) ;
}
// Return the number of letters following the dot.
// Returns 4 if there is no dot.
// (So "r0.xy" returns 2 and "r0" returns 4).
int GetNumWriteMaskEntries ( const char * pParam )
{
const char * pDot = strchr ( pParam , ' . ' ) ;
if ( pDot )
return V_strlen ( pDot + 1 ) ;
else
return 4 ;
}
const char * GetSwizzleDot ( const char * pParam )
{
const char * pDot = strrchr ( pParam , ' . ' ) ;
const char * pSquareClose = strrchr ( pParam , ' ] ' ) ;
if ( pSquareClose )
{
// The test against ']' catches cases like, so we point to the last dot vc[int(va_r.x) + 29].x
if ( pDot & & ( pSquareClose < pDot ) )
return pDot ;
else
return NULL ;
}
// Make sure the next character is a valid swizzle since we want to treat strings like vec4( gl_Normal, 0.0 ) as a whole param name.
if ( pDot & & ( ( * ( pDot + 1 ) = = ' x ' ) | | ( * ( pDot + 1 ) = = ' y ' ) | | ( * ( pDot + 1 ) = = ' z ' ) | | ( * ( pDot + 1 ) = = ' w ' ) | |
( * ( pDot + 1 ) = = ' r ' ) | | ( * ( pDot + 1 ) = = ' g ' ) | | ( * ( pDot + 1 ) = = ' b ' ) | | ( * ( pDot + 1 ) = = ' z ' ) ) )
{
return pDot ;
}
return NULL ;
}
int GetNumSwizzleComponents ( const char * pParam )
{
// Special scalar output which won't accept a swizzle
if ( ! V_stricmp ( pParam , " gl_FogFragCoord " ) )
return 1 ;
// Special scalar output which won't accept a swizzle
if ( ! V_stricmp ( pParam , " gl_FragDepth " ) )
return 1 ;
// Special scalar output which won't accept a swizzle
if ( ! V_stricmp ( pParam , " a0 " ) )
return 1 ;
const char * pDot = GetSwizzleDot ( pParam ) ;
if ( pDot )
{
pDot + + ; // Step over the dot
int nNumSwizzleComponents = 0 ;
while ( ( * pDot = = ' x ' ) | | ( * pDot = = ' y ' ) | | ( * pDot = = ' z ' ) | | ( * pDot = = ' w ' ) | |
( * pDot = = ' r ' ) | | ( * pDot = = ' g ' ) | | ( * pDot = = ' b ' ) | | ( * pDot = = ' z ' ) )
{
nNumSwizzleComponents + + ;
pDot + + ;
}
return nNumSwizzleComponents ;
}
return 0 ;
}
char GetSwizzleComponent ( const char * pParam , int n )
{
Assert ( n < 4 ) ;
const char * pDot = GetSwizzleDot ( pParam ) ;
if ( pDot )
{
+ + pDot ;
int nComponents = ( int ) V_strlen ( pDot ) ;
Assert ( nComponents > 0 ) ;
if ( n < nComponents )
return pDot [ n ] ;
else
return pDot [ nComponents - 1 ] ;
}
return g_szDefaultSwizzle [ n ] ;
}
// Replace the parameter name and leave the swizzle intact.
// So "somevar.xyz" becomes "othervar.xyz".
void ReplaceParamName ( const char * pSrc , const char * pNewParamName , char * pOut , int nOutLen )
{
// Start with the new parameter name.
V_strncpy ( pOut , pNewParamName , nOutLen ) ;
// Now add the swizzle if necessary.
const char * pDot = GetSwizzleDot ( pSrc ) ;
if ( pDot )
{
V_strncat ( pOut , pDot , nOutLen ) ;
}
}
void GetParamNameWithoutSwizzle ( const char * pParam , char * pOut , int nOutLen )
{
char * pParamStart = ( char * ) pParam ;
const char * pDot = GetSwizzleDot ( pParam ) ; // dot followed by valid swizzle characters
bool bAbsWrapper = false ;
// Check for abs() or -abs() wrapper and strip it off during the fixup
if ( ! V_strncmp ( pParam , " abs( " , 4 ) | | ! V_strncmp ( pParam , " -abs( " , 5 ) )
{
const char * pOpenParen = strchr ( pParam , ' ( ' ) ; // FIRST opening paren
const char * pClosingParen = strrchr ( pParam , ' ) ' ) ; // LAST closing paren
Assert ( pOpenParen & & pClosingParen ) ;
pClosingParen ; // hush compiler
pParamStart = ( char * ) pOpenParen ;
pParamStart + + ;
bAbsWrapper = true ;
}
if ( pDot )
{
int nToCopy = MIN ( nOutLen - 1 , pDot - pParamStart ) ;
memcpy ( pOut , pParamStart , nToCopy ) ;
pOut [ nToCopy ] = 0 ;
}
else
{
V_strncpy ( pOut , pParamStart , bAbsWrapper ? nOutLen - 1 : nOutLen ) ;
}
}
bool DoParamNamesMatch ( const char * pParam1 , const char * pParam2 )
{
char szTemp [ 2 ] [ 256 ] ;
GetParamNameWithoutSwizzle ( pParam1 , szTemp [ 0 ] , sizeof ( szTemp [ 0 ] ) ) ;
GetParamNameWithoutSwizzle ( pParam2 , szTemp [ 1 ] , sizeof ( szTemp [ 1 ] ) ) ;
return ( V_stricmp ( szTemp [ 0 ] , szTemp [ 1 ] ) = = 0 ) ;
}
// Extract the n'th component of the swizzle mask.
// If n would exceed the length of the swizzle mask, then it looks up into "xyzw".
void WriteParamWithSingleMaskEntry ( const char * pParam , int n , char * pOut , int nOutLen )
{
bool bCloseParen = false ;
if ( ! V_strncmp ( pParam , " -abs( " , 5 ) )
{
V_strcpy ( pOut , " -abs( " ) ;
bCloseParen = true ;
pOut + = 5 ; nOutLen - = 5 ;
}
else if ( ! V_strncmp ( pParam , " abs( " , 4 ) )
{
V_strcpy ( pOut , " abs( " ) ;
bCloseParen = true ;
pOut + = 4 ; nOutLen - = 4 ;
}
GetParamNameWithoutSwizzle ( pParam , pOut , nOutLen ) ;
PrintToBuf ( pOut , nOutLen , " . " ) ;
PrintToBuf ( pOut , nOutLen , " %c " , GetSwizzleComponent ( pParam , n ) ) ;
if ( bCloseParen )
{
PrintToBuf ( pOut , nOutLen , " ) " ) ;
}
}
float uint32ToFloat ( uint32 dw )
{
return * ( ( float * ) & dw ) ;
}
CUtlString EnsureNumSwizzleComponents ( const char * pSrcRegisterName , int nComponents )
{
int nExisting = GetNumSwizzleComponents ( pSrcRegisterName ) ;
if ( nExisting = = nComponents )
return pSrcRegisterName ;
bool bAbsWrapper = false ; // Parameter wrapped in an abs()
bool bAbsNegative = false ; // -abs()
char szSrcRegister [ 128 ] ;
V_strncpy ( szSrcRegister , pSrcRegisterName , sizeof ( szSrcRegister ) ) ;
// Check for abs() or -abs() wrapper and strip it off during the fixup
if ( ! V_strncmp ( pSrcRegisterName , " abs( " , 4 ) | | ! V_strncmp ( pSrcRegisterName , " -abs( " , 5 ) )
{
bAbsWrapper = true ;
bAbsNegative = pSrcRegisterName [ 0 ] = = ' - ' ;
const char * pOpenParen = strchr ( pSrcRegisterName , ' ( ' ) ; // FIRST opening paren
const char * pClosingParen = strrchr ( pSrcRegisterName , ' ) ' ) ; // LAST closing paren
Assert ( pOpenParen & & pClosingParen ) ; // If we start with abs( and don't get both parens, something is very wrong
// Copy out just the register name with no abs()
int nRegNameLength = pClosingParen - pOpenParen - 1 ;
V_strncpy ( szSrcRegister , pOpenParen + 1 , nRegNameLength + 1 ) ; // Kind of a weird function...copy more than you need and slam the last char to NULL-terminate
}
char szReg [ 256 ] ;
GetParamNameWithoutSwizzle ( szSrcRegister , szReg , sizeof ( szReg ) ) ;
if ( nComponents = = 0 )
return szReg ;
PrintToBuf ( szReg , sizeof ( szReg ) , " . " ) ;
if ( nExisting > nComponents )
{
// DX ASM will sometimes have statements like "NRM r0.xyz, r1.yzww", where it just doesn't use the last part of r1. So we won't either.
for ( int i = 0 ; i < nComponents ; i + + )
{
PrintToBuf ( szReg , sizeof ( szReg ) , " %c " , GetSwizzleComponent ( szSrcRegister , i ) ) ;
}
}
else
{
if ( nExisting = = 0 )
{
// We've got something like r0 and need N more components, so add as much of "xyzw" is needed.
for ( int i = 0 ; i < nComponents ; i + + )
PrintToBuf ( szReg , sizeof ( szReg ) , " %c " , g_szDefaultSwizzle [ i ] ) ;
}
else
{
// We've got something like r0.x and need N more components, so replicate the X so it looks like r0.xxx
V_strncpy ( szReg , szSrcRegister , sizeof ( szReg ) ) ;
char cLast = szSrcRegister [ V_strlen ( szSrcRegister ) - 1 ] ;
for ( int i = nExisting ; i < nComponents ; i + + )
{
PrintToBuf ( szReg , sizeof ( szReg ) , " %c " , cLast ) ;
}
}
}
if ( bAbsWrapper )
{
char szTemp [ 128 ] ;
V_strncpy ( szTemp , szReg , sizeof ( szTemp ) ) ;
V_snprintf ( szReg , sizeof ( szReg ) , " %sabs(%s) " , bAbsNegative ? " - " : " " , szTemp ) ;
}
return szReg ;
}
static void TranslationError ( )
{
GLMDebugPrintf ( " D3DToGL: GLSL translation error! \n " ) ;
DebuggerBreakIfDebugging ( ) ;
Error ( " D3DToGL: GLSL translation error! \n " ) ;
}
D3DToGL : : D3DToGL ( )
{
}
uint32 D3DToGL : : GetNextToken ( void )
{
uint32 dwToken = * m_pdwNextToken ;
m_pdwNextToken + + ;
return dwToken ;
}
void D3DToGL : : SkipTokens ( uint32 numToSkip )
{
m_pdwNextToken + = numToSkip ;
}
uint32 D3DToGL : : Opcode ( uint32 dwToken )
{
return ( dwToken & D3DSI_OPCODE_MASK ) ;
}
uint32 D3DToGL : : OpcodeSpecificData ( uint32 dwToken )
{
return ( ( dwToken & D3DSP_OPCODESPECIFICCONTROL_MASK ) > > D3DSP_OPCODESPECIFICCONTROL_SHIFT ) ;
}
uint32 D3DToGL : : TextureType ( uint32 dwToken )
{
return ( dwToken & D3DSP_TEXTURETYPE_MASK ) ; // Note this one doesn't shift due to weird D3DSAMPLER_TEXTURE_TYPE enum
}
// Print GLSL intrinsic corresponding to particular instruction
bool D3DToGL : : OpenIntrinsic ( uint32 inst , char * buff , int nBufLen , uint32 destDimension , uint32 nArgumentDimension )
{
// Some GLSL intrinsics need type conversion, which we do in this routine
// As a result, the caller must sometimes close both parentheses, not just one
bool bDoubleClose = false ;
if ( nArgumentDimension = = 0 )
{
nArgumentDimension = 4 ;
}
switch ( inst )
{
case D3DSIO_RSQ :
V_snprintf ( buff , nBufLen , " inversesqrt( " ) ;
break ;
case D3DSIO_DP3 :
case D3DSIO_DP4 :
if ( destDimension = = 1 )
{
V_snprintf ( buff , nBufLen , " dot( " ) ;
}
else
{
if ( ! destDimension )
destDimension = 4 ;
V_snprintf ( buff , nBufLen , " vec%d( dot( " , destDimension ) ;
bDoubleClose = true ;
}
break ;
case D3DSIO_MIN :
V_snprintf ( buff , nBufLen , " min( " ) ;
break ;
case D3DSIO_MAX :
V_snprintf ( buff , nBufLen , " max( " ) ;
break ;
case D3DSIO_SLT :
if ( nArgumentDimension = = 1 )
{
V_snprintf ( buff , nBufLen , " float( " ) ; // lessThan doesn't have a scalar version
}
else
{
Assert ( nArgumentDimension > 1 ) ;
V_snprintf ( buff , nBufLen , " vec%d( lessThan( " , nArgumentDimension ) ;
bDoubleClose = true ;
}
break ;
case D3DSIO_SGE :
if ( nArgumentDimension = = 1 )
{
V_snprintf ( buff , nBufLen , " float( " ) ; // greaterThanEqual doesn't have a scalar version
}
else
{
Assert ( nArgumentDimension > 1 ) ;
V_snprintf ( buff , nBufLen , " vec%d( greaterThanEqual( " , nArgumentDimension ) ;
bDoubleClose = true ;
}
break ;
case D3DSIO_EXP :
V_snprintf ( buff , nBufLen , " exp( " ) ; // exp2 ?
break ;
case D3DSIO_LOG :
V_snprintf ( buff , nBufLen , " log( " ) ; // log2 ?
break ;
case D3DSIO_LIT :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " lit( " ) ; // gonna have to write this one
break ;
case D3DSIO_DST :
V_snprintf ( buff , nBufLen , " dst( " ) ; // gonna have to write this one
break ;
case D3DSIO_LRP :
Assert ( ! m_bVertexShader ) ;
V_snprintf ( buff , nBufLen , " mix( " ) ;
break ;
case D3DSIO_FRC :
V_snprintf ( buff , nBufLen , " fract( " ) ;
break ;
case D3DSIO_M4x4 :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " m4x4 " ) ;
break ;
case D3DSIO_M4x3 :
case D3DSIO_M3x4 :
case D3DSIO_M3x3 :
case D3DSIO_M3x2 :
case D3DSIO_CALL :
case D3DSIO_CALLNZ :
case D3DSIO_LOOP :
case D3DSIO_RET :
case D3DSIO_ENDLOOP :
case D3DSIO_LABEL :
case D3DSIO_DCL :
TranslationError ( ) ;
break ;
case D3DSIO_POW :
V_snprintf ( buff , nBufLen , " pow( " ) ;
break ;
case D3DSIO_CRS :
V_snprintf ( buff , nBufLen , " cross( " ) ;
break ;
case D3DSIO_SGN :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " sign( " ) ;
break ;
case D3DSIO_ABS :
V_snprintf ( buff , nBufLen , " abs( " ) ;
break ;
case D3DSIO_NRM :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " normalize( " ) ;
break ;
case D3DSIO_SINCOS :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " sincos( " ) ; // gonna have to write this one
break ;
case D3DSIO_REP :
case D3DSIO_ENDREP :
case D3DSIO_IF :
case D3DSIO_IFC :
case D3DSIO_ELSE :
case D3DSIO_ENDIF :
case D3DSIO_BREAK :
case D3DSIO_BREAKC : // TODO: these are the reason we even need GLSL...gotta make these work
TranslationError ( ) ;
break ;
case D3DSIO_DEFB :
case D3DSIO_DEFI :
TranslationError ( ) ;
break ;
case D3DSIO_TEXCOORD :
V_snprintf ( buff , nBufLen , " texcoord " ) ;
break ;
case D3DSIO_TEXKILL :
V_snprintf ( buff , nBufLen , " kill( " ) ; // wrap the discard instruction?
break ;
case D3DSIO_TEX :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " TEX " ) ; // We shouldn't get here
break ;
case D3DSIO_TEXBEM :
case D3DSIO_TEXBEML :
case D3DSIO_TEXREG2AR :
case D3DSIO_TEXREG2GB :
case D3DSIO_TEXM3x2PAD :
case D3DSIO_TEXM3x2TEX :
case D3DSIO_TEXM3x3PAD :
case D3DSIO_TEXM3x3TEX :
case D3DSIO_TEXM3x3SPEC :
case D3DSIO_TEXM3x3VSPEC :
TranslationError ( ) ;
break ;
case D3DSIO_EXPP :
V_snprintf ( buff , nBufLen , " exp( " ) ;
break ;
case D3DSIO_LOGP :
V_snprintf ( buff , nBufLen , " log( " ) ;
break ;
case D3DSIO_CND :
TranslationError ( ) ;
break ;
case D3DSIO_DEF :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " DEF " ) ;
break ;
case D3DSIO_TEXREG2RGB :
case D3DSIO_TEXDP3TEX :
case D3DSIO_TEXM3x2DEPTH :
case D3DSIO_TEXDP3 :
case D3DSIO_TEXM3x3 :
TranslationError ( ) ;
break ;
case D3DSIO_TEXDEPTH :
V_snprintf ( buff , nBufLen , " texdepth " ) ;
break ;
case D3DSIO_CMP :
TranslationError ( ) ;
Assert ( ! m_bVertexShader ) ;
V_snprintf ( buff , nBufLen , " CMP " ) ;
break ;
case D3DSIO_BEM :
TranslationError ( ) ;
break ;
case D3DSIO_DP2ADD :
TranslationError ( ) ;
break ;
case D3DSIO_DSX :
case D3DSIO_DSY :
TranslationError ( ) ;
break ;
case D3DSIO_TEXLDD :
V_snprintf ( buff , nBufLen , " texldd " ) ;
break ;
case D3DSIO_SETP :
TranslationError ( ) ;
break ;
case D3DSIO_TEXLDL :
V_snprintf ( buff , nBufLen , " texldl " ) ;
break ;
case D3DSIO_BREAKP :
case D3DSIO_PHASE :
TranslationError ( ) ;
break ;
}
return bDoubleClose ;
}
const char * D3DToGL : : GetGLSLOperatorString ( uint32 inst )
{
if ( inst = = D3DSIO_ADD )
return " + " ;
else if ( inst = = D3DSIO_SUB )
return " - " ;
else if ( inst = = D3DSIO_MUL )
return " * " ;
Error ( " GetGLSLOperatorString: unknown operator " ) ;
return " zzzz " ;
}
// Print ASM opcode
void D3DToGL : : PrintOpcode ( uint32 inst , char * buff , int nBufLen )
{
switch ( inst )
{
case D3DSIO_NOP :
V_snprintf ( buff , nBufLen , " NOP " ) ;
TranslationError ( ) ;
break ;
case D3DSIO_MOV :
V_snprintf ( buff , nBufLen , " MOV " ) ;
break ;
case D3DSIO_ADD :
V_snprintf ( buff , nBufLen , " ADD " ) ;
break ;
case D3DSIO_SUB :
V_snprintf ( buff , nBufLen , " SUB " ) ;
break ;
case D3DSIO_MAD :
V_snprintf ( buff , nBufLen , " MAD " ) ;
break ;
case D3DSIO_MUL :
V_snprintf ( buff , nBufLen , " MUL " ) ;
break ;
case D3DSIO_RCP :
V_snprintf ( buff , nBufLen , " RCP " ) ;
break ;
case D3DSIO_RSQ :
V_snprintf ( buff , nBufLen , " RSQ " ) ;
break ;
case D3DSIO_DP3 :
V_snprintf ( buff , nBufLen , " DP3 " ) ;
break ;
case D3DSIO_DP4 :
V_snprintf ( buff , nBufLen , " DP4 " ) ;
break ;
case D3DSIO_MIN :
V_snprintf ( buff , nBufLen , " MIN " ) ;
break ;
case D3DSIO_MAX :
V_snprintf ( buff , nBufLen , " MAX " ) ;
break ;
case D3DSIO_SLT :
V_snprintf ( buff , nBufLen , " SLT " ) ;
break ;
case D3DSIO_SGE :
V_snprintf ( buff , nBufLen , " SGE " ) ;
break ;
case D3DSIO_EXP :
V_snprintf ( buff , nBufLen , " EX2 " ) ;
break ;
case D3DSIO_LOG :
V_snprintf ( buff , nBufLen , " LG2 " ) ;
break ;
case D3DSIO_LIT :
V_snprintf ( buff , nBufLen , " LIT " ) ;
break ;
case D3DSIO_DST :
V_snprintf ( buff , nBufLen , " DST " ) ;
break ;
case D3DSIO_LRP :
Assert ( ! m_bVertexShader ) ;
V_snprintf ( buff , nBufLen , " LRP " ) ;
break ;
case D3DSIO_FRC :
V_snprintf ( buff , nBufLen , " FRC " ) ;
break ;
case D3DSIO_M4x4 :
V_snprintf ( buff , nBufLen , " m4x4 " ) ;
break ;
case D3DSIO_M4x3 :
case D3DSIO_M3x4 :
case D3DSIO_M3x3 :
case D3DSIO_M3x2 :
case D3DSIO_CALL :
case D3DSIO_CALLNZ :
case D3DSIO_LOOP :
case D3DSIO_RET :
case D3DSIO_ENDLOOP :
case D3DSIO_LABEL :
TranslationError ( ) ;
break ;
case D3DSIO_DCL :
V_snprintf ( buff , nBufLen , " DCL " ) ;
break ;
case D3DSIO_POW :
V_snprintf ( buff , nBufLen , " POW " ) ;
break ;
case D3DSIO_CRS :
V_snprintf ( buff , nBufLen , " XPD " ) ;
break ;
case D3DSIO_SGN :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " SGN " ) ;
break ;
case D3DSIO_ABS :
V_snprintf ( buff , nBufLen , " ABS " ) ;
break ;
case D3DSIO_NRM :
TranslationError ( ) ;
V_snprintf ( buff , nBufLen , " NRM " ) ;
break ;
case D3DSIO_SINCOS :
Assert ( ! m_bVertexShader ) ;
V_snprintf ( buff , nBufLen , " SCS " ) ;
break ;
case D3DSIO_REP :
case D3DSIO_ENDREP :
case D3DSIO_IF :
case D3DSIO_IFC :
case D3DSIO_ELSE :
case D3DSIO_ENDIF :
case D3DSIO_BREAK :
case D3DSIO_BREAKC :
TranslationError ( ) ;
break ;
case D3DSIO_MOVA :
Assert ( m_bVertexShader ) ;
V_snprintf ( buff , nBufLen , " MOV " ) ; // We're always moving into a temp instead, so this is MOV instead of ARL
break ;
case D3DSIO_DEFB :
case D3DSIO_DEFI :
TranslationError ( ) ;
break ;
case D3DSIO_TEXCOORD :
V_snprintf ( buff , nBufLen , " texcoord " ) ;
break ;
case D3DSIO_TEXKILL :
V_snprintf ( buff , nBufLen , " KIL " ) ;
break ;
case D3DSIO_TEX :
V_snprintf ( buff , nBufLen , " TEX " ) ;
break ;
case D3DSIO_TEXBEM :
case D3DSIO_TEXBEML :
case D3DSIO_TEXREG2AR :
case D3DSIO_TEXREG2GB :
case D3DSIO_TEXM3x2PAD :
case D3DSIO_TEXM3x2TEX :
case D3DSIO_TEXM3x3PAD :
case D3DSIO_TEXM3x3TEX :
case D3DSIO_TEXM3x3SPEC :
case D3DSIO_TEXM3x3VSPEC :
TranslationError ( ) ;
break ;
case D3DSIO_EXPP :
V_snprintf ( buff , nBufLen , " EXP " ) ;
break ;
case D3DSIO_LOGP :
V_snprintf ( buff , nBufLen , " LOG " ) ;
break ;
case D3DSIO_CND :
TranslationError ( ) ;
break ;
case D3DSIO_DEF :
V_snprintf ( buff , nBufLen , " DEF " ) ;
break ;
case D3DSIO_TEXREG2RGB :
case D3DSIO_TEXDP3TEX :
case D3DSIO_TEXM3x2DEPTH :
case D3DSIO_TEXDP3 :
case D3DSIO_TEXM3x3 :
TranslationError ( ) ;
break ;
case D3DSIO_TEXDEPTH :
V_snprintf ( buff , nBufLen , " texdepth " ) ;
break ;
case D3DSIO_CMP :
Assert ( ! m_bVertexShader ) ;
V_snprintf ( buff , nBufLen , " CMP " ) ;
break ;
case D3DSIO_BEM :
TranslationError ( ) ;
break ;
case D3DSIO_DP2ADD :
TranslationError ( ) ;
break ;
case D3DSIO_DSX :
case D3DSIO_DSY :
TranslationError ( ) ;
break ;
case D3DSIO_TEXLDD :
V_snprintf ( buff , nBufLen , " texldd " ) ;
break ;
case D3DSIO_SETP :
TranslationError ( ) ;
break ;
case D3DSIO_TEXLDL :
V_snprintf ( buff , nBufLen , " texldl " ) ;
break ;
case D3DSIO_BREAKP :
case D3DSIO_PHASE :
TranslationError ( ) ;
break ;
}
}
CUtlString D3DToGL : : GetUsageAndIndexString ( uint32 dwToken , int fSemanticFlags )
{
char szTemp [ 1024 ] ;
PrintUsageAndIndexToString ( dwToken , szTemp , sizeof ( szTemp ) , fSemanticFlags ) ;
return szTemp ;
}
//------------------------------------------------------------------------------
// Helper function which prints ASCII representation of usage-usageindex pair to string
//
// Strictly used by vertex shaders
// not used any more now that we have attribmap metadata
//------------------------------------------------------------------------------
void D3DToGL : : PrintUsageAndIndexToString ( uint32 dwToken , char * strUsageUsageIndexName , int nBufLen , int fSemanticFlags )
{
uint32 dwUsage = ( dwToken & D3DSP_DCL_USAGE_MASK ) ;
uint32 dwUsageIndex = ( dwToken & D3DSP_DCL_USAGEINDEX_MASK ) > > D3DSP_DCL_USAGEINDEX_SHIFT ;
switch ( dwUsage )
{
case D3DDECLUSAGE_POSITION :
if ( m_bVertexShader )
{
if ( fSemanticFlags & SEMANTIC_OUTPUT )
V_snprintf ( strUsageUsageIndexName , nBufLen , " vTempPos " ) ; // effectively gl_Position
else
V_snprintf ( strUsageUsageIndexName , nBufLen , " gl_Vertex " ) ;
}
else
{
// .xy = position in viewport coordinates
// .z = depth
V_snprintf ( strUsageUsageIndexName , nBufLen , " gl_FragCoord " ) ;
}
break ;
case D3DDECLUSAGE_BLENDWEIGHT :
V_snprintf ( strUsageUsageIndexName , nBufLen , " vertex.attrib[1] " ) ; // "vertex.attrib[12]" ); // or [1]
break ;
case D3DDECLUSAGE_BLENDINDICES :
V_snprintf ( strUsageUsageIndexName , nBufLen , " vertex.attrib[13] " ) ; // "vertex.attrib[13]" ); // or [ 7 ]
break ;
case D3DDECLUSAGE_NORMAL :
V_snprintf ( strUsageUsageIndexName , nBufLen , " vec4( gl_Normal, 0.0 ) " ) ;
break ;
case D3DDECLUSAGE_PSIZE :
TranslationError ( ) ;
V_snprintf ( strUsageUsageIndexName , nBufLen , " _psize " ) ; // no analog
break ;
case D3DDECLUSAGE_TEXCOORD :
V_snprintf ( strUsageUsageIndexName , nBufLen , " oT%d " , dwUsageIndex ) ;
break ;
case D3DDECLUSAGE_TANGENT :
NoteTangentInputUsed ( ) ;
V_strncpy ( strUsageUsageIndexName , g_pTangentAttributeName , nBufLen ) ;
break ;
case D3DDECLUSAGE_BINORMAL :
V_snprintf ( strUsageUsageIndexName , nBufLen , " vertex.attrib[14] " ) ; // aka texc[6]
break ;
// case D3DDECLUSAGE_TESSFACTOR:
// TranslationError();
// V_snprintf( strUsageUsageIndexName, nBufLen, "_position" ); // no analog
// break;
// case D3DDECLUSAGE_POSITIONT:
// TranslationError();
// V_snprintf( strUsageUsageIndexName, nBufLen, "_positiont" ); // no analog
// break;
case D3DDECLUSAGE_COLOR :
Assert ( dwUsageIndex < = 1 ) ;
// if ( fSemanticFlags & SEMANTIC_OUTPUT )
// V_snprintf( strUsageUsageIndexName, nBufLen, dwUsageIndex != 0 ? "gl_BackColor" : "gl_FrontColor" );
// else
V_snprintf ( strUsageUsageIndexName , nBufLen , dwUsageIndex ! = 0 ? " _gl_FrontSecondaryColor " : " _gl_FrontColor " ) ;
break ;
case D3DDECLUSAGE_FOG :
TranslationError ( ) ;
break ;
case D3DDECLUSAGE_DEPTH :
TranslationError ( ) ;
V_snprintf ( strUsageUsageIndexName , nBufLen , " _depth " ) ; // no analog
break ;
case D3DDECLUSAGE_SAMPLE :
TranslationError ( ) ;
V_snprintf ( strUsageUsageIndexName , nBufLen , " _sample " ) ; // no analog
break ;
default :
Debugger ( ) ;
break ;
}
}
uint32 D3DToGL : : GetRegType ( uint32 dwRegToken )
{
return ( ( dwRegToken & D3DSP_REGTYPE_MASK2 ) > > D3DSP_REGTYPE_SHIFT2 ) | ( ( dwRegToken & D3DSP_REGTYPE_MASK ) > > D3DSP_REGTYPE_SHIFT ) ;
}
void D3DToGL : : PrintIndentation ( char * pBuf , int nBufLen )
{
for ( int i = 0 ; i < m_NumIndentTabs ; i + + )
{
strcat_s ( pBuf , nBufLen , " \t " ) ;
}
}
CUtlString D3DToGL : : GetParameterString ( uint32 dwToken , uint32 dwSourceOrDest , bool bForceScalarSource , int * pARLDestReg )
{
char szTemp [ 1024 ] ;
PrintParameterToString ( dwToken , dwSourceOrDest , szTemp , sizeof ( szTemp ) , bForceScalarSource , pARLDestReg ) ;
return szTemp ;
}
// If the register happens to end with ".xyzw", then this strips off the mask.
void SimplifyFourParamRegister ( char * pRegister )
{
int nLen = V_strlen ( pRegister ) ;
if ( nLen > 5 & & V_strcmp ( & pRegister [ nLen - 5 ] , " .xyzw " ) = = 0 )
pRegister [ nLen - 5 ] = 0 ;
}
// This returns 0 for x, 1 for y, 2 for z, and 3 for w.
int GetSwizzleComponentVectorIndex ( char chMask )
{
if ( chMask = = ' x ' )
return 0 ;
else if ( chMask = = ' y ' )
return 1 ;
else if ( chMask = = ' z ' )
return 2 ;
else if ( chMask = = ' w ' )
return 3 ;
Error ( " GetSwizzleComponentVectorIndex( '%c' ) - invalid parameter. \n " , chMask ) ;
return 0 ;
}
// GLSL needs the # of src masks to match the dest write mask.
//
// So this:
// r0.xy = r1 + r2;
// becomes:
// r0.xy = r1.xy + r2.xy;
//
//
// Also, and this is the trickier one: GLSL reads the source registers from their first component on
// whereas D3D reads them as referenced in the dest register mask!
//
// So this code in D3D:
// r0.yz = c0.x + c1.wxyz
// Really means:
// r0.y = c0.x + c1.x
// r0.z = c0.x + c1.y
// So we translate it to this in GLSL:
// r0.yz = c0.xx + c1.wx
// r0.yz = c0.xx + c1.xy
//
CUtlString D3DToGL : : FixGLSLSwizzle ( const char * pDestRegisterName , const char * pSrcRegisterName )
{
bool bAbsWrapper = false ; // Parameter wrapped in an abs()
bool bAbsNegative = false ; // -abs()
char szSrcRegister [ 128 ] ;
V_strncpy ( szSrcRegister , pSrcRegisterName , sizeof ( szSrcRegister ) ) ;
// Check for abs() or -abs() wrapper and strip it off during the fixup
if ( ! V_strncmp ( pSrcRegisterName , " abs( " , 4 ) | | ! V_strncmp ( pSrcRegisterName , " -abs( " , 5 ) )
{
bAbsWrapper = true ;
bAbsNegative = pSrcRegisterName [ 0 ] = = ' - ' ;
const char * pOpenParen = strchr ( pSrcRegisterName , ' ( ' ) ; // FIRST opening paren
const char * pClosingParen = strrchr ( pSrcRegisterName , ' ) ' ) ; // LAST closing paren
Assert ( pOpenParen & & pClosingParen ) ; // If we start with abs( and don't get both parens, something is very wrong
// Copy out just the register name with no abs()
int nRegNameLength = pClosingParen - pOpenParen - 1 ;
V_strncpy ( szSrcRegister , pOpenParen + 1 , nRegNameLength + 1 ) ; // Kind of a weird function...copy more than you need and slam the last char to NULL-terminate
}
int nSwizzlesInDest = GetNumSwizzleComponents ( pDestRegisterName ) ;
if ( nSwizzlesInDest = = 0 )
nSwizzlesInDest = 4 ;
char szFixedSrcRegister [ 128 ] ;
GetParamNameWithoutSwizzle ( szSrcRegister , szFixedSrcRegister , sizeof ( szFixedSrcRegister ) ) ;
V_strncat ( szFixedSrcRegister , " . " , sizeof ( szFixedSrcRegister ) ) ;
for ( int i = 0 ; i < nSwizzlesInDest ; i + + )
{
char chDestWriteMask = GetSwizzleComponent ( pDestRegisterName , i ) ;
int nVectorIndex = GetSwizzleComponentVectorIndex ( chDestWriteMask ) ;
char ch [ 2 ] ;
ch [ 0 ] = GetSwizzleComponent ( szSrcRegister , nVectorIndex ) ;
ch [ 1 ] = 0 ;
V_strncat ( szFixedSrcRegister , ch , sizeof ( szFixedSrcRegister ) ) ;
}
SimplifyFourParamRegister ( szFixedSrcRegister ) ;
if ( bAbsWrapper )
{
char szTempSrcRegister [ 128 ] ;
V_strncpy ( szTempSrcRegister , szFixedSrcRegister , sizeof ( szTempSrcRegister ) ) ;
V_snprintf ( szFixedSrcRegister , sizeof ( szFixedSrcRegister ) , " %sabs(%s) " , bAbsNegative ? " - " : " " , szTempSrcRegister ) ;
}
return szFixedSrcRegister ;
}
// Weird encoding...bits are split apart in the dwToken
inline uint32 GetRegTypeFromToken ( uint32 dwToken )
{
return ( ( dwToken & D3DSP_REGTYPE_MASK2 ) > > D3DSP_REGTYPE_SHIFT2 ) | ( ( dwToken & D3DSP_REGTYPE_MASK ) > > D3DSP_REGTYPE_SHIFT ) ;
}
void D3DToGL : : FlagIndirectRegister ( uint32 dwToken , int * pARLDestReg )
{
if ( ! pARLDestReg )
return ;
switch ( dwToken & D3DVS_SWIZZLE_MASK & D3DVS_X_W )
{
case D3DVS_X_X :
* pARLDestReg = ARL_DEST_X ;
break ;
case D3DVS_X_Y :
* pARLDestReg = ARL_DEST_Y ;
break ;
case D3DVS_X_Z :
* pARLDestReg = ARL_DEST_Z ;
break ;
case D3DVS_X_W :
* pARLDestReg = ARL_DEST_W ;
break ;
}
}
//------------------------------------------------------------------------------
// PrintParameterToString()
//
// Helper function which prints ASCII representation of passed Parameter dwToken
// to string. Token defines parameter details. The dwSourceOrDest parameter says
// whether or not this is a source or destination register
//------------------------------------------------------------------------------
void D3DToGL : : PrintParameterToString ( uint32 dwToken , uint32 dwSourceOrDest , char * pRegisterName , int nBufLen , bool bForceScalarSource , int * pARLDestReg )
{
char buff [ 32 ] ;
bool bAllowWriteMask = true ;
bool bAllowSwizzle = true ;
uint32 dwRegNum = dwToken & D3DSP_REGNUM_MASK ;
uint32 dwRegType , dwSwizzle ;
uint32 dwSrcModifier = D3DSPSM_NONE ;
// Clear string to zero length
pRegisterName [ 0 ] = 0 ;
dwRegType = GetRegTypeFromToken ( dwToken ) ;
// If this is a dest register
if ( dwSourceOrDest = = DST_REGISTER )
{
// Instruction modifiers
if ( dwToken & D3DSPDM_PARTIALPRECISION )
{
// strcat_s( pRegisterName, nBufLen, "_pp" );
}
if ( dwToken & D3DSPDM_MSAMPCENTROID )
{
// strcat_s( pRegisterName, nBufLen, "_centroid" );
}
}
// If this is a source register
if ( dwSourceOrDest = = SRC_REGISTER )
{
dwSrcModifier = dwToken & D3DSP_SRCMOD_MASK ;
// If there are any source modifiers, check to see if they're at
// least partially "prefix" and prepend appropriately
if ( dwSrcModifier ! = D3DSPSM_NONE )
{
switch ( dwSrcModifier )
{
// These four start with just minus... (some may result in "postfix" notation as well later on)
case D3DSPSM_NEG : // negate
strcat_s ( pRegisterName , nBufLen , " - " ) ;
break ;
case D3DSPSM_BIASNEG : // bias and negate
case D3DSPSM_SIGNNEG : // sign and negate
case D3DSPSM_X2NEG : // *2 and negate
TranslationError ( ) ;
strcat_s ( pRegisterName , nBufLen , " - " ) ;
break ;
case D3DSPSM_COMP : // complement
TranslationError ( ) ;
strcat_s ( pRegisterName , nBufLen , " 1- " ) ;
break ;
case D3DSPSM_ABS : // abs()
strcat_s ( pRegisterName , nBufLen , " abs( " ) ;
break ;
case D3DSPSM_ABSNEG : // -abs()
strcat_s ( pRegisterName , nBufLen , " -abs( " ) ;
break ;
case D3DSPSM_NOT : // for predicate register: "!p0"
TranslationError ( ) ;
strcat_s ( pRegisterName , nBufLen , " ! " ) ;
break ;
}
}
}
// Register name (from type and number)
switch ( dwRegType )
{
case D3DSPR_TEMP :
V_snprintf ( buff , sizeof ( buff ) , " r%d " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
m_dwTempUsageMask | = 0x00000001 < < dwRegNum ; // Keep track of the use of this temp
break ;
case D3DSPR_INPUT :
if ( ! m_bVertexShader & & ( dwSourceOrDest = = SRC_REGISTER ) )
{
if ( m_dwMajorVersion = = 3 )
{
V_snprintf ( buff , sizeof ( buff ) , " oTempT%d " , dwRegNum ) ;
}
else
{
V_snprintf ( buff , sizeof ( buff ) , dwRegNum = = 0 ? " _gl_FrontColor " : " _gl_FrontSecondaryColor " ) ;
}
strcat_s ( pRegisterName , nBufLen , buff ) ;
}
else
{
V_snprintf ( buff , sizeof ( buff ) , " v%d " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
}
break ;
case D3DSPR_CONST :
if ( m_bConstantRegisterDefined [ dwRegNum ] )
{
char szConstantRegName [ 3 ] ;
if ( m_bVertexShader )
{
V_snprintf ( szConstantRegName , 3 , " vd " ) ;
}
else
{
V_snprintf ( szConstantRegName , 3 , " pd " ) ;
}
// Put defined constants into their own namespace "d"
V_snprintf ( buff , sizeof ( buff ) , " %s%d " , szConstantRegName , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
}
else if ( dwToken & D3DSHADER_ADDRESSMODE_MASK ) // Indirect addressing (e.g. skinning in a vertex shader)
{
char szConstantRegName [ 16 ] ;
if ( m_bVertexShader )
{
V_snprintf ( szConstantRegName , 3 , " vc " ) ;
}
else // No indirect addressing in PS, this shouldn't happen
{
TranslationError ( ) ;
V_snprintf ( szConstantRegName , 3 , " pc " ) ;
}
if ( ( m_bGenerateBoneUniformBuffer ) & & ( dwRegNum > = DXABSTRACT_VS_FIRST_BONE_SLOT ) )
{
if ( dwRegNum < DXABSTRACT_VS_LAST_BONE_SLOT )
{
dwRegNum - = DXABSTRACT_VS_FIRST_BONE_SLOT ;
V_strcpy ( szConstantRegName , " vcbones " ) ;
m_nHighestBoneRegister = ( DXABSTRACT_VS_PARAM_SLOTS - 1 ) - DXABSTRACT_VS_FIRST_BONE_SLOT ;
}
else
{
dwRegNum - = ( DXABSTRACT_VS_LAST_BONE_SLOT + 1 ) - DXABSTRACT_VS_FIRST_BONE_SLOT ;
m_nHighestRegister = m_bGenerateBoneUniformBuffer ? ( ( DXABSTRACT_VS_PARAM_SLOTS - 1 ) - ( ( DXABSTRACT_VS_LAST_BONE_SLOT + 1 ) - DXABSTRACT_VS_FIRST_BONE_SLOT ) ) : ( DXABSTRACT_VS_PARAM_SLOTS - 1 ) ;
}
}
else
{
m_nHighestRegister = m_bGenerateBoneUniformBuffer ? ( ( DXABSTRACT_VS_PARAM_SLOTS - 1 ) - ( ( DXABSTRACT_VS_LAST_BONE_SLOT + 1 ) - DXABSTRACT_VS_FIRST_BONE_SLOT ) ) : ( DXABSTRACT_VS_PARAM_SLOTS - 1 ) ;
}
// Index into single pc/vc[] register array with relative addressing
int nDstReg = - 1 ;
FlagIndirectRegister ( GetNextToken ( ) , & nDstReg ) ;
if ( pARLDestReg )
* pARLDestReg = nDstReg ;
Assert ( nDstReg ! = ARL_DEST_NONE ) ;
int nSrcSwizzle = ' x ' ;
if ( nDstReg = = ARL_DEST_Y )
nSrcSwizzle = ' y ' ;
else if ( nDstReg = = ARL_DEST_Z )
nSrcSwizzle = ' z ' ;
else if ( nDstReg = = ARL_DEST_W )
nSrcSwizzle = ' w ' ;
V_snprintf ( buff , sizeof ( buff ) , " %s[int(va_r.%c) + %d] " , szConstantRegName , nSrcSwizzle , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
// Must allow swizzling, otherwise this example doesn't compile right: mad r3.xyz, c27[a0.w].w, r3, r7
//bAllowSwizzle = false;
}
else // Direct addressing of constant array
{
char szConstantRegName [ 16 ] ;
V_snprintf ( szConstantRegName , 3 , m_bVertexShader ? " vc " : " pc " ) ;
if ( ( m_bGenerateBoneUniformBuffer ) & & ( dwRegNum > = DXABSTRACT_VS_FIRST_BONE_SLOT ) )
{
if ( dwRegNum < DXABSTRACT_VS_LAST_BONE_SLOT )
{
dwRegNum - = DXABSTRACT_VS_FIRST_BONE_SLOT ;
V_strcpy ( szConstantRegName , " vcbones " ) ;
m_nHighestBoneRegister = MAX ( m_nHighestBoneRegister , ( int ) dwRegNum ) ;
}
else
{
// handles case where constants after the bones are used (c217 onwards), these are to be concatenated with those before the bones (c0-c57)
// keep track of regnum for concatenated array
dwRegNum - = ( DXABSTRACT_VS_LAST_BONE_SLOT + 1 ) - DXABSTRACT_VS_FIRST_BONE_SLOT ;
m_nHighestRegister = MAX ( m_nHighestRegister , dwRegNum ) ;
}
}
else
{
//// NOGO if (dwRegNum != 255) // have seen cases where dwRegNum is 0xFF... need to figure out where those opcodes are coming from
{
m_nHighestRegister = MAX ( m_nHighestRegister , dwRegNum ) ;
}
Assert ( m_nHighestRegister < DXABSTRACT_VS_PARAM_SLOTS ) ;
}
// Index into single pc/vc[] register array with absolute addressing, same for GLSL and ASM
V_snprintf ( buff , sizeof ( buff ) , " %s[%d] " , szConstantRegName , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
}
break ;
case D3DSPR_ADDR : // aliases to D3DSPR_TEXTURE
if ( m_bVertexShader )
{
Assert ( dwRegNum = = 0 ) ;
V_snprintf ( buff , sizeof ( buff ) , " va_r " ) ;
}
else // D3DSPR_TEXTURE in the pixel shader
{
// If dest reg, this is an iterator/varying declaration
if ( dwSourceOrDest = = DST_REGISTER )
{
// Is this iterator centroid?
if ( m_nCentroidMask & ( 0x00000001 < < dwRegNum ) )
{
V_snprintf ( buff , sizeof ( buff ) , " centroid in vec4 oT%d " , dwRegNum ) ; // centroid varying
}
else
{
V_snprintf ( buff , sizeof ( buff ) , " in vec4 oT%d " , dwRegNum ) ;
}
bAllowWriteMask = false ;
}
else // source register
{
V_snprintf ( buff , sizeof ( buff ) , " oT%d " , dwRegNum ) ;
}
}
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_RASTOUT : // vertex shader oPos
Assert ( m_bVertexShader ) ;
Assert ( m_dwMajorVersion = = 2 ) ;
switch ( dwRegNum )
{
case D3DSRO_POSITION :
strcat_s ( pRegisterName , nBufLen , " vTempPos " ) ; // In GLSL, this ends up in gl_Position later on
m_bDeclareVSOPos = true ;
break ;
case D3DSRO_FOG :
if ( ! m_bFogFragCoord )
{
StrcatToHeaderCode ( " varying mediump vec4 _gl_FogFragCoord; \n " ) ;
m_bFogFragCoord = true ;
}
strcat_s ( pRegisterName , nBufLen , " _gl_FogFragCoord " ) ;
m_bDeclareVSOFog = true ;
break ;
default :
printf ( " \n D3DSPR_RASTOUT: dwRegNum is %08x and token is %08x " , dwRegNum , dwToken ) ;
TranslationError ( ) ;
break ;
}
break ;
case D3DSPR_ATTROUT :
Assert ( m_bVertexShader ) ;
Assert ( m_dwMajorVersion = = 2 ) ;
if ( dwRegNum = = 0 )
{
if ( ! m_bFrontColor )
{
StrcatToHeaderCode ( " varying lowp vec4 _gl_FrontColor; \n " ) ;
m_bFrontColor = true ;
}
V_snprintf ( buff , sizeof ( buff ) , " _gl_FrontColor " ) ;
}
else if ( dwRegNum = = 1 )
{
if ( ! m_bFrontSecondaryColor )
{
StrcatToHeaderCode ( " varying lowp vec4 _gl_FrontSecondaryColor; \n " ) ;
m_bFrontSecondaryColor = true ;
}
V_snprintf ( buff , sizeof ( buff ) , " _gl_FrontSecondaryColor " ) ;
}
else
{
Error ( " Invalid D3DSPR_ATTROUT index " ) ;
}
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_TEXCRDOUT : // aliases to D3DSPR_OUTPUT
if ( m_bVertexShader )
{
if ( m_nVSPositionOutput = = ( int32 ) dwRegNum )
{
V_snprintf ( buff , sizeof ( buff ) , " vTempPos " ) ; // This output varying is the position
}
else if ( m_dwMajorVersion = = 3 )
{
V_snprintf ( buff , sizeof ( buff ) , " oTempT%d " , dwRegNum ) ;
}
else
{
V_snprintf ( buff , sizeof ( buff ) , " oT%d " , dwRegNum ) ;
}
m_dwTexCoordOutMask | = ( 0x00000001 < < dwRegNum ) ;
}
else
{
V_snprintf ( buff , sizeof ( buff ) , " oC%d " , dwRegNum ) ;
}
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_CONSTINT :
V_snprintf ( buff , sizeof ( buff ) , " i%d " , dwRegNum ) ; // Loops use these
strcat_s ( pRegisterName , nBufLen , buff ) ;
m_dwConstIntUsageMask | = 0x00000001 < < dwRegNum ; // Keep track of the use of this integer constant
break ;
case D3DSPR_COLOROUT :
if ( dwRegNum + 1 > m_iFragDataCount )
m_iFragDataCount = dwRegNum + 1 ;
V_snprintf ( buff , sizeof ( buff ) , " gl_FragData[%d] " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
m_bOutputColorRegister [ dwRegNum ] = true ;
break ;
case D3DSPR_DEPTHOUT :
V_snprintf ( buff , sizeof ( buff ) , " gl_FragDepth " ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
m_bOutputDepthRegister = true ;
break ;
case D3DSPR_SAMPLER :
V_snprintf ( buff , sizeof ( buff ) , " sampler%d " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_CONST2 :
TranslationError ( ) ;
V_snprintf ( buff , sizeof ( buff ) , " c%d " , dwRegNum + 2048 ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_CONST3 :
TranslationError ( ) ;
V_snprintf ( buff , sizeof ( buff ) , " c%d " , dwRegNum + 4096 ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_CONST4 :
TranslationError ( ) ;
V_snprintf ( buff , sizeof ( buff ) , " c%d " , dwRegNum + 6144 ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_CONSTBOOL :
V_snprintf ( buff , sizeof ( buff ) , m_bVertexShader ? " b%d " : " fb%d " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
m_dwConstBoolUsageMask | = 0x00000001 < < dwRegNum ; // Keep track of the use of this bool constant
break ;
case D3DSPR_LOOP :
TranslationError ( ) ;
V_snprintf ( buff , sizeof ( buff ) , " aL%d " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_TEMPFLOAT16 :
TranslationError ( ) ;
V_snprintf ( buff , sizeof ( buff ) , " temp_float16_xxx%d " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_MISCTYPE :
Assert ( dwRegNum = = 0 ) ; // So far, we know that MISC[0] is gl_FragCoord (aka vPos in DX ASM parlance), but we don't know about any other MISC registers
V_snprintf ( buff , sizeof ( buff ) , " gl_FragCoord " ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_LABEL :
TranslationError ( ) ;
V_snprintf ( buff , sizeof ( buff ) , " label%d " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
case D3DSPR_PREDICATE :
TranslationError ( ) ;
V_snprintf ( buff , sizeof ( buff ) , " p%d " , dwRegNum ) ;
strcat_s ( pRegisterName , nBufLen , buff ) ;
break ;
}
// If this is a dest register
if ( dwSourceOrDest = = DST_REGISTER )
{
//
// Write masks
//
// If some (not all, not none) of the write masks are set, we should include them
//
if ( bAllowWriteMask & & ( ! ( ( dwToken & D3DSP_WRITEMASK_ALL ) = = D3DSP_WRITEMASK_ALL ) | | ( ( dwToken & D3DSP_WRITEMASK_ALL ) = = 0x00000000 ) ) )
{
// Put the dot on there
strcat_s ( pRegisterName , nBufLen , " . " ) ;
// Optionally put on the x, y, z or w
int nMasksWritten = 0 ;
if ( dwToken & D3DSP_WRITEMASK_0 )
{
strcat_s ( pRegisterName , nBufLen , " x " ) ;
+ + nMasksWritten ;
}
if ( dwToken & D3DSP_WRITEMASK_1 )
{
strcat_s ( pRegisterName , nBufLen , " y " ) ;
+ + nMasksWritten ;
}
if ( dwToken & D3DSP_WRITEMASK_2 )
{
strcat_s ( pRegisterName , nBufLen , " z " ) ;
+ + nMasksWritten ;
}
if ( dwToken & D3DSP_WRITEMASK_3 )
{
strcat_s ( pRegisterName , nBufLen , " w " ) ;
+ + nMasksWritten ;
}
}
}
else // must be a source register
{
if ( bAllowSwizzle ) // relative addressing hard-codes the swizzle on a0.x
{
uint32 dwXSwizzle , dwYSwizzle , dwZSwizzle , dwWSwizzle ;
// Mask out the swizzle modifier
dwSwizzle = dwToken & D3DVS_SWIZZLE_MASK ;
// If there are any swizzles at all, tack on the appropriate notation
if ( dwSwizzle ! = D3DVS_NOSWIZZLE )
{
// Separate out the two-bit codes for each component swizzle
dwXSwizzle = dwSwizzle & D3DVS_X_W ;
dwYSwizzle = dwSwizzle & D3DVS_Y_W ;
dwZSwizzle = dwSwizzle & D3DVS_Z_W ;
dwWSwizzle = dwSwizzle & D3DVS_W_W ;
// Put on the dot
strcat_s ( pRegisterName , nBufLen , " . " ) ;
// See where X comes from
switch ( dwXSwizzle )
{
case D3DVS_X_X :
strcat_s ( pRegisterName , nBufLen , " x " ) ;
break ;
case D3DVS_X_Y :
strcat_s ( pRegisterName , nBufLen , " y " ) ;
break ;
case D3DVS_X_Z :
strcat_s ( pRegisterName , nBufLen , " z " ) ;
break ;
case D3DVS_X_W :
strcat_s ( pRegisterName , nBufLen , " w " ) ;
break ;
}
if ( ! bForceScalarSource )
{
// If the source of the remaining components are aren't
// identical to the source of x, continue with swizzle
if ( ( ( dwXSwizzle > > D3DVS_SWIZZLE_SHIFT ) ! = ( dwYSwizzle > > ( D3DVS_SWIZZLE_SHIFT + 2 ) ) ) | | // X and Y sources match?
( ( dwXSwizzle > > D3DVS_SWIZZLE_SHIFT ) ! = ( dwZSwizzle > > ( D3DVS_SWIZZLE_SHIFT + 4 ) ) ) | | // X and Z sources match?
( ( dwXSwizzle > > D3DVS_SWIZZLE_SHIFT ) ! = ( dwWSwizzle > > ( D3DVS_SWIZZLE_SHIFT + 6 ) ) ) ) // X and W sources match?
{
// OpenGL seems to want us to have either 1 or 4 components in a swizzle, so just plow on through the rest
switch ( dwYSwizzle )
{
case D3DVS_Y_X :
strcat_s ( pRegisterName , nBufLen , " x " ) ;
break ;
case D3DVS_Y_Y :
strcat_s ( pRegisterName , nBufLen , " y " ) ;
break ;
case D3DVS_Y_Z :
strcat_s ( pRegisterName , nBufLen , " z " ) ;
break ;
case D3DVS_Y_W :
strcat_s ( pRegisterName , nBufLen , " w " ) ;
break ;
}
switch ( dwZSwizzle )
{
case D3DVS_Z_X :
strcat_s ( pRegisterName , nBufLen , " x " ) ;
break ;
case D3DVS_Z_Y :
strcat_s ( pRegisterName , nBufLen , " y " ) ;
break ;
case D3DVS_Z_Z :
strcat_s ( pRegisterName , nBufLen , " z " ) ;
break ;
case D3DVS_Z_W :
strcat_s ( pRegisterName , nBufLen , " w " ) ;
break ;
}
switch ( dwWSwizzle )
{
case D3DVS_W_X :
strcat_s ( pRegisterName , nBufLen , " x " ) ;
break ;
case D3DVS_W_Y :
strcat_s ( pRegisterName , nBufLen , " y " ) ;
break ;
case D3DVS_W_Z :
strcat_s ( pRegisterName , nBufLen , " z " ) ;
break ;
case D3DVS_W_W :
strcat_s ( pRegisterName , nBufLen , " w " ) ;
break ;
}
}
} // end !bForceScalarSource
}
else // dwSwizzle == D3DVS_NOSWIZZLE
{
// If this is a MOVA / ARL, GL on the Mac requires us to tack the .x onto the source register
if ( bForceScalarSource )
{
strcat_s ( pRegisterName , nBufLen , " .x " ) ;
}
}
} // bAllowSwizzle
// If there are any source modifiers, check to see if they're at
// least partially "postfix" and tack them on as appropriate
if ( dwSrcModifier ! = D3DSPSM_NONE )
{
switch ( dwSrcModifier )
{
case D3DSPSM_BIAS : // bias
case D3DSPSM_BIASNEG : // bias and negate
TranslationError ( ) ;
strcat_s ( pRegisterName , nBufLen , " _bx2 " ) ;
break ;
case D3DSPSM_SIGN : // sign
case D3DSPSM_SIGNNEG : // sign and negate
TranslationError ( ) ;
strcat_s ( pRegisterName , nBufLen , " _sgn " ) ;
break ;
case D3DSPSM_X2 : // *2
case D3DSPSM_X2NEG : // *2 and negate
TranslationError ( ) ;
strcat_s ( pRegisterName , nBufLen , " _x2 " ) ;
break ;
case D3DSPSM_ABS : // abs()
case D3DSPSM_ABSNEG : // -abs()
strcat_s ( pRegisterName , nBufLen , " ) " ) ;
break ;
case D3DSPSM_DZ : // divide through by z component
TranslationError ( ) ;
strcat_s ( pRegisterName , nBufLen , " _dz " ) ;
break ;
case D3DSPSM_DW : // divide through by w component
TranslationError ( ) ;
strcat_s ( pRegisterName , nBufLen , " _dw " ) ;
break ;
}
} // end postfix modifiers (really only ps.1.x)
}
}
void D3DToGL : : RecordInputAndOutputPositions ( )
{
// Remember where we are in the token stream.
m_pRecordedInputTokenStart = m_pdwNextToken ;
// Remember where our outputs are.
m_nRecordedParamCodeStrlen = V_strlen ( ( char * ) m_pBufParamCode - > Base ( ) ) ;
m_nRecordedALUCodeStrlen = V_strlen ( ( char * ) m_pBufALUCode - > Base ( ) ) ;
m_nRecordedAttribCodeStrlen = V_strlen ( ( char * ) m_pBufAttribCode - > Base ( ) ) ;
}
void D3DToGL : : AddTokenHexCodeToBuffer ( char * pBuffer , int nSize , int nLastStrlen )
{
int nCurStrlen = V_strlen ( pBuffer ) ;
if ( nCurStrlen = = nLastStrlen )
return ;
// Build a string with all the hex codes of the tokens since last time.
char szHex [ 512 ] ;
szHex [ 0 ] = ' \n ' ;
V_snprintf ( & szHex [ 1 ] , sizeof ( szHex ) - 1 , HEXCODE_HEADER ) ;
int nTokens = MIN ( 10 , m_pdwNextToken - m_pRecordedInputTokenStart ) ;
for ( int i = 0 ; i < nTokens ; i + + )
{
char szTemp [ 32 ] ;
V_snprintf ( szTemp , sizeof ( szTemp ) , " 0x%x " , m_pRecordedInputTokenStart [ i ] ) ;
V_strncat ( szHex , szTemp , sizeof ( szHex ) ) ;
}
V_strncat ( szHex , " \n " , sizeof ( szHex ) ) ;
// Insert the hex codes into the string.
int nBytesToInsert = V_strlen ( szHex ) ;
if ( nCurStrlen + nBytesToInsert + 1 > = nSize )
Error ( " Buffer overflow writing token hex codes " ) ;
if ( m_bPutHexCodesAfterLines )
{
// Put it at the end of the last line.
if ( pBuffer [ nCurStrlen - 1 ] = = ' \n ' )
pBuffer [ nCurStrlen - 1 ] = 0 ;
V_strncat ( pBuffer , & szHex [ 1 ] , nSize ) ;
}
else
{
memmove ( pBuffer + nLastStrlen + nBytesToInsert , pBuffer + nLastStrlen , nCurStrlen - nLastStrlen + 1 ) ;
memcpy ( pBuffer + nLastStrlen , szHex , nBytesToInsert ) ;
}
}
void D3DToGL : : AddTokenHexCode ( )
{
if ( m_pdwNextToken > m_pRecordedInputTokenStart )
{
AddTokenHexCodeToBuffer ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) , m_nRecordedParamCodeStrlen ) ;
AddTokenHexCodeToBuffer ( ( char * ) m_pBufALUCode - > Base ( ) , m_pBufALUCode - > Size ( ) , m_nRecordedALUCodeStrlen ) ;
AddTokenHexCodeToBuffer ( ( char * ) m_pBufAttribCode - > Base ( ) , m_pBufAttribCode - > Size ( ) , m_nRecordedAttribCodeStrlen ) ;
}
}
uint32 D3DToGL : : MaintainAttributeMap ( uint32 dwToken , uint32 dwRegToken )
{
// Check that this reg index has not been used before - if it has, let Houston know
uint dwRegIndex = dwRegToken & D3DSP_REGNUM_MASK ;
if ( m_dwAttribMap [ dwRegIndex ] = = 0xFFFFFFFF )
{
// log it
// semantic/usage in the higher nibble
// usage index in the low nibble
uint usage = dwToken & D3DSP_DCL_USAGE_MASK ;
uint usageindex = ( dwToken & D3DSP_DCL_USAGEINDEX_MASK ) > > D3DSP_DCL_USAGEINDEX_SHIFT ;
m_dwAttribMap [ dwRegIndex ] = ( usage < < 4 ) | usageindex ;
// avoid writing 0xBB since runtime code uses that for an 'unused' marker
if ( m_dwAttribMap [ dwRegIndex ] = = 0xBB )
{
Debugger ( ) ;
}
}
else
{
//not OK
Debugger ( ) ;
}
return dwRegIndex ;
}
void D3DToGL : : Handle_DCL ( )
{
uint32 dwToken = GetNextToken ( ) ; // What kind of dcl is this...
uint32 dwRegToken = GetNextToken ( ) ; // Look ahead to register token
uint32 dwUsage = ( dwToken & D3DSP_DCL_USAGE_MASK ) ;
uint32 dwUsageIndex = ( dwToken & D3DSP_DCL_USAGEINDEX_MASK ) > > D3DSP_DCL_USAGEINDEX_SHIFT ;
uint32 dwRegNum = dwRegToken & D3DSP_REGNUM_MASK ;
uint32 nRegType = GetRegTypeFromToken ( dwRegToken ) ;
if ( m_bVertexShader )
{
// If this is an output, remember the index (what the ASM code calls o0, o1, o2..) and the semantic.
// When GetParameterString( DST_REGISTER ) hits this one, we'll return "oN".
// At the end of the main() function, we'll insert a bunch of statements like "gl_Color = o2" based on what we remembered here.
if ( ( m_dwMajorVersion > = 3 ) & & ( nRegType = = D3DSPR_OUTPUT ) )
{
// uint32 dwRegComponents = ( dwRegToken & D3DSP_WRITEMASK_ALL ) >> 16; // Components used by the output register (1 means float, 3 means vec2, 7 means vec3, f means vec4)
if ( dwRegNum > = MAX_DECLARED_OUTPUTS )
Error ( " Output register number (%d) too high (only %d supported). " , dwRegNum , MAX_DECLARED_OUTPUTS ) ;
if ( m_DeclaredOutputs [ dwRegNum ] ! = UNDECLARED_OUTPUT )
Error ( " Output dcl_ hit for register #%d more than once! " , dwRegNum ) ;
Assert ( dwToken ! = UNDECLARED_OUTPUT ) ;
m_DeclaredOutputs [ dwRegNum ] = dwToken ;
//uint32 dwUsage = ( dwToken & D3DSP_DCL_USAGE_MASK );
//uint32 dwUsageIndex = ( dwToken & D3DSP_DCL_USAGEINDEX_MASK ) >> D3DSP_DCL_USAGEINDEX_SHIFT;
// Flag which o# output register maps to gl_Position
if ( dwUsage = = D3DDECLUSAGE_POSITION )
{
m_nVSPositionOutput = dwUsageIndex ;
m_bDeclareVSOPos = true ;
}
if ( m_bAddHexCodeComments )
{
CUtlString sParam2 = GetUsageAndIndexString ( dwToken , SEMANTIC_OUTPUT ) ;
PrintToBuf ( * m_pBufHeaderCode , " // [GL remembering that oT%d maps to %s] \n " , dwRegNum , sParam2 . String ( ) ) ;
}
}
else if ( GetRegType ( dwRegToken ) = = D3DSPR_SAMPLER )
{
// We can support vertex texturing if necessary, but I can't find a use case in any branch. (HW morphing in L4D2 isn't enabled, and the comments indicate that r_hwmorph isn't compatible with mat_queue_mode anyway, and CS:GO/DoTA don't use vertex shader texturing.)
TranslationError ( ) ;
int nRegNum = dwRegToken & D3DSP_REGNUM_MASK ;
switch ( TextureType ( dwToken ) )
{
default :
case D3DSTT_UNKNOWN :
case D3DSTT_2D :
m_dwSamplerTypes [ nRegNum ] = SAMPLER_TYPE_2D ;
break ;
case D3DSTT_CUBE :
m_dwSamplerTypes [ nRegNum ] = SAMPLER_TYPE_CUBE ;
break ;
case D3DSTT_VOLUME :
m_dwSamplerTypes [ nRegNum ] = SAMPLER_TYPE_3D ;
break ;
}
// Track sampler declarations
m_dwSamplerUsageMask | = 1 < < nRegNum ;
}
else
{
Assert ( GetRegType ( dwRegToken ) = = D3DSPR_INPUT ) ;
CUtlString sParam1 = GetParameterString ( dwRegToken , DST_REGISTER , false , NULL ) ;
CUtlString sParam2 = GetUsageAndIndexString ( dwToken , SEMANTIC_INPUT ) ;
sParam2 = FixGLSLSwizzle ( sParam1 , sParam2 ) ;
PrintToBuf ( * m_pBufHeaderCode , " in vec4 %s; // " , sParam1 . String ( ) ) ;
MaintainAttributeMap ( dwToken , dwRegToken ) ;
char temp [ 128 ] ;
// regnum goes straight into the vertex.attrib[n] index
sprintf ( temp , " %08x %08x \n " , dwToken , dwRegToken ) ;
StrcatToHeaderCode ( temp ) ;
}
}
else // Pixel shader
{
// If the register is a sampler, the dcl has a dimension decorator that we have to save for subsequent TEX instructions
uint32 nRegType = GetRegType ( dwRegToken ) ;
if ( nRegType = = D3DSPR_SAMPLER )
{
int nRegNum = dwRegToken & D3DSP_REGNUM_MASK ;
switch ( TextureType ( dwToken ) )
{
default :
case D3DSTT_UNKNOWN :
case D3DSTT_2D :
m_dwSamplerTypes [ nRegNum ] = SAMPLER_TYPE_2D ;
break ;
case D3DSTT_CUBE :
m_dwSamplerTypes [ nRegNum ] = SAMPLER_TYPE_CUBE ;
break ;
case D3DSTT_VOLUME :
m_dwSamplerTypes [ nRegNum ] = SAMPLER_TYPE_3D ;
break ;
}
// Track sampler declarations
m_dwSamplerUsageMask | = 1 < < nRegNum ;
}
else // Not a sampler, we're going to generate varying declaration code
{
// In pixel shaders we only declare texture coordinate varyings since they may be using centroid
if ( ( m_dwMajorVersion = = 3 ) & & ( nRegType = = D3DSPR_INPUT ) )
{
Assert ( m_DeclaredInputs [ dwRegNum ] = = UNDECLARED_INPUT ) ;
m_DeclaredInputs [ dwRegNum ] = dwToken ;
if ( ( dwUsage ! = D3DDECLUSAGE_COLOR ) & & ( dwUsage ! = D3DDECLUSAGE_TEXCOORD ) )
{
TranslationError ( ) ; // Not supported yet, but can be if we need it.
}
if ( dwUsage = = D3DDECLUSAGE_TEXCOORD )
{
char buf [ 256 ] ;
if ( m_nCentroidMask & ( 0x00000001 < < dwUsageIndex ) )
{
V_snprintf ( buf , sizeof ( buf ) , " centroid in vec4 oT%d; \n " , dwUsageIndex ) ; // centroid varying
}
else
{
V_snprintf ( buf , sizeof ( buf ) , " in vec4 oT%d; \n " , dwUsageIndex ) ;
}
StrcatToHeaderCode ( buf ) ;
}
}
else if ( nRegType = = D3DSPR_TEXTURE )
{
char buff [ 256 ] ;
PrintParameterToString ( dwRegToken , DST_REGISTER , buff , sizeof ( buff ) , false , NULL ) ;
PrintToBuf ( * m_pBufHeaderCode , " %s; \n " , buff ) ;
}
else
{
// No need to declare anything (probably D3DSPR_MISCTYPE either VPOS or VFACE)
}
}
}
}
static bool IsFloatNaN ( float f )
{
const uint nBits = * reinterpret_cast < uint * > ( & f ) ;
const uint nExponent = ( nBits > > 23 ) & 0xFF ;
return ( nExponent = = 255 ) ;
}
static inline bool EqualTol ( double a , double b , double t )
{
return fabs ( a - b ) < = ( ( MAX ( fabs ( a ) , fabs ( b ) ) + 1.0 ) * t ) ;
}
// Originally written by Bruce Dawson, see:
// See http://randomascii.wordpress.com/2012/03/08/float-precisionfrom-zero-to-100-digits-2/
// This class represents a very limited high-precision number with 'count' 32-bit
// unsigned elements.
template < int count >
struct HighPrec
{
typedef unsigned T ;
typedef unsigned long long Product_t ;
static const int kWordShift = 32 ;
HighPrec ( )
{
memset ( m_data , 0 , sizeof ( m_data ) ) ;
m_nLowestNonZeroIndex = ARRAYSIZE ( m_data ) ;
}
// Insert the bits from value into m_data, shifted in from the bottom (least
// significant end) by the specified number of bits. A shift of zero or less
// means that none of the bits will be shifted in. A shift of one means that
// the high bit of value will be in the bottom of the last element of m_data -
// the least significant bit. A shift of kWordShift means that value will be
// in the least significant element of m_data, and so on.
void InsertLowBits ( T value , int shiftAmount )
{
if ( shiftAmount < = 0 )
return ;
int subShift = shiftAmount & ( kWordShift - 1 ) ;
int bigShift = shiftAmount / kWordShift ;
Product_t result = ( Product_t ) value < < subShift ;
T resultLow = ( T ) result ;
T resultHigh = result > > kWordShift ;
// Use an unsigned type so that negative numbers will become large,
// which makes the range checking below simpler.
unsigned highIndex = ARRAYSIZE ( m_data ) - 1 - bigShift ;
// Write the results to the data array. If the index is too large
// then that means that the data was shifted off the edge.
if ( ( highIndex < ARRAYSIZE ( m_data ) ) & & ( resultHigh ) )
{
m_data [ highIndex ] | = resultHigh ;
m_nLowestNonZeroIndex = MIN ( m_nLowestNonZeroIndex , highIndex ) ;
}
if ( ( highIndex + 1 < ARRAYSIZE ( m_data ) ) & & ( resultLow ) )
{
m_data [ highIndex + 1 ] | = resultLow ;
m_nLowestNonZeroIndex = MIN ( m_nLowestNonZeroIndex , highIndex + 1 ) ;
}
}
// Insert the bits from value into m_data, shifted in from the top (most
// significant end) by the specified number of bits. A shift of zero or less
// means that none of the bits will be shifted in. A shift of one means that
// the low bit of value will be in the top of the first element of m_data -
// the most significant bit. A shift of kWordShift means that value will be
// in the most significant element of m_data, and so on.
void InsertTopBits ( T value , int shiftAmount )
{
InsertLowBits ( value , ( ARRAYSIZE ( m_data ) + 1 ) * kWordShift - shiftAmount ) ;
}
// Return true if all elements of m_data are zero.
bool IsZero ( ) const
{
bool bIsZero = ( m_nLowestNonZeroIndex = = ARRAYSIZE ( m_data ) ) ;
# ifdef DEBUG
for ( int i = 0 ; i < ARRAYSIZE ( m_data ) ; + + i )
{
if ( m_data [ i ] )
{
Assert ( ! bIsZero ) ;
return false ;
}
}
Assert ( bIsZero ) ;
# endif
return bIsZero ;
}
// Divide by div and return the remainder, from 0 to div-1.
// Standard long-division algorithm.
T DivReturnRemainder ( T divisor )
{
T remainder = 0 ;
# ifdef DEBUG
for ( uint j = 0 ; j < m_nLowestNonZeroIndex ; + + j )
{
Assert ( m_data [ j ] = = 0 ) ;
}
# endif
int nNewLowestNonZeroIndex = ARRAYSIZE ( m_data ) ;
for ( int i = m_nLowestNonZeroIndex ; i < ARRAYSIZE ( m_data ) ; + + i )
{
Product_t dividend = ( ( Product_t ) remainder < < kWordShift ) + m_data [ i ] ;
Product_t result = dividend / divisor ;
remainder = T ( dividend % divisor ) ;
m_data [ i ] = T ( result ) ;
if ( ( result ) & & ( nNewLowestNonZeroIndex = = ARRAYSIZE ( m_data ) ) )
nNewLowestNonZeroIndex = i ;
}
m_nLowestNonZeroIndex = nNewLowestNonZeroIndex ;
return remainder ;
}
// The individual 'digits' (32-bit unsigned integers actually) that
// make up the number. The most-significant digit is in m_data[0].
T m_data [ count ] ;
uint m_nLowestNonZeroIndex ;
} ;
union Double_t
{
Double_t ( double num = 0.0f ) : f ( num ) { }
// Portable extraction of components.
bool Negative ( ) const { return ( i > > 63 ) ! = 0 ; }
int64_t RawMantissa ( ) const { return i & ( ( 1LL < < 52 ) - 1 ) ; }
int64_t RawExponent ( ) const { return ( i > > 52 ) & 0x7FF ; }
int64_t i ;
double f ;
} ;
static uint PrintDoubleInt ( char * pBuf , uint nBufSize , double f , uint nMinChars )
{
static const char * pDigits = " 00010203040506070809101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899 " ;
Assert ( ! nMinChars | | ( ( nMinChars % 6 ) = = 0 ) ) ;
char * pLastChar = pBuf + nBufSize - 1 ;
char * pDst = pLastChar ;
* pDst - - = ' \0 ' ;
// Put the double in our magic union so we can grab the components.
union Double_t num ( f ) ;
// Get the character that represents the sign.
// Check for NaNs or infinity.
if ( num . RawExponent ( ) = = 2047 )
{
TranslationError ( ) ;
}
// Adjust for the exponent bias.
int exponentValue = int ( num . RawExponent ( ) - 1023 ) ;
// Add the implied one to the mantissa.
uint64_t mantissaValue = ( 1ll < < 52 ) + num . RawMantissa ( ) ;
// Special-case for denormals - no special exponent value and
// no implied one.
if ( num . RawExponent ( ) = = 0 )
{
exponentValue = - 1022 ;
mantissaValue = num . RawMantissa ( ) ;
}
uint32_t mantissaHigh = mantissaValue > > 32 ;
uint32_t mantissaLow = mantissaValue & 0xFFFFFFFF ;
// The first bit of the mantissa has an implied value of one and this can
// be shifted 1023 positions to the left, so that's 1024 bits to the left
// of the binary point, or 32 32-bit words for the integer part.
HighPrec < 32 > intPart ;
// When our exponentValue is zero (a number in the 1.0 to 2.0 range)
// we have a 53-bit mantissa and the implied value of the highest bit
// is 1. We need to shift 12 bits in from the bottom to get that 53rd bit
// into the ones spot in the integral portion.
// To complicate it a bit more we have to insert the mantissa as two parts.
intPart . InsertLowBits ( mantissaHigh , 12 + exponentValue ) ;
intPart . InsertLowBits ( mantissaLow , 12 + exponentValue - 32 ) ;
bool bAnyDigitsLeft ;
do
{
uint remainder = intPart . DivReturnRemainder ( 1000000 ) ; // 10^6
uint origRemainer = remainder ; ( void ) origRemainer ;
bAnyDigitsLeft = ! intPart . IsZero ( ) ;
if ( bAnyDigitsLeft )
{
uint n = remainder % 100U ; remainder / = 100U ; * reinterpret_cast < uint16 * > ( pDst - 1 ) = reinterpret_cast < const uint16 * > ( pDigits ) [ n ] ;
n = remainder % 100U ; remainder / = 100U ; * reinterpret_cast < uint16 * > ( pDst - 1 - 2 ) = reinterpret_cast < const uint16 * > ( pDigits ) [ n ] ;
Assert ( remainder < 100U ) ;
* reinterpret_cast < uint16 * > ( pDst - 1 - 4 ) = reinterpret_cast < const uint16 * > ( pDigits ) [ remainder ] ;
pDst - = 6 ;
}
else
{
uint n = remainder % 100U ; remainder / = 100U ; * reinterpret_cast < uint16 * > ( pDst - 1 ) = reinterpret_cast < const uint16 * > ( pDigits ) [ n ] ; - - pDst ; if ( ( n > = 10 ) | | ( remainder ) ) - - pDst ;
if ( remainder )
{
n = remainder % 100U ; remainder / = 100U ; * reinterpret_cast < uint16 * > ( pDst - 1 ) = reinterpret_cast < const uint16 * > ( pDigits ) [ n ] ; - - pDst ; if ( ( n > = 10 ) | | ( remainder ) ) - - pDst ;
if ( remainder )
{
Assert ( remainder < 100U ) ;
* reinterpret_cast < uint16 * > ( pDst - 1 ) = reinterpret_cast < const uint16 * > ( pDigits ) [ remainder ] ; - - pDst ; if ( remainder > = 10 ) - - pDst ;
}
}
}
} while ( bAnyDigitsLeft ) ;
uint l = pLastChar - pDst ;
while ( ( l - 1 ) < nMinChars )
{
* pDst - - = ' 0 ' ;
l + + ;
}
Assert ( ( int ) l = = ( pLastChar - pDst ) ) ;
Assert ( l < = nBufSize ) ;
memmove ( pBuf , pDst + 1 , l ) ;
return l - 1 ;
}
// FloatToString is equivalent to sprintf( "%.12f" ), but doesn't have any dependencies on the current locale setting.
// Unfortunately, high accuracy radix conversion is actually pretty tricky to do right.
// Most importantly, this function has the same max roundtrip (IEEE->ASCII->IEEE) error as the MS CRT functions and can reliably handle extremely large inputs.
static void FloatToString ( char * pBuf , uint nBufSize , double fConst )
{
char * pEnd = pBuf + nBufSize ;
char * pDst = pBuf ;
double flVal = fConst ;
if ( IsFloatNaN ( flVal ) )
{
flVal = 0 ;
}
if ( flVal < 0.0f )
{
* pDst + + = ' - ' ;
flVal = - flVal ;
}
double flInt ;
double flFract = modf ( flVal , & flInt ) ;
flFract = floor ( flFract * 1000000000000.0 + .5 ) ;
if ( ! flInt )
{
* pDst + + = ' 0 ' ;
}
else
{
uint l = PrintDoubleInt ( pDst , pEnd - pDst , flInt , 0 ) ;
pDst + = l ;
}
* pDst + + = ' . ' ;
if ( ! flFract )
{
* pDst + + = ' 0 ' ;
* pDst + + = ' \0 ' ;
}
else
{
uint l = PrintDoubleInt ( pDst , pEnd - pDst , flFract , 12 ) ;
pDst + = l ;
StripExtraTrailingZeros ( pBuf ) ; // Turn 1.00000 into 1.0
}
}
#if 0
# include "vstdlib/random.h"
static void TestFloatConversion ( )
{
for ( ; ; )
{
double fConst ;
switch ( rand ( ) % 4 )
{
case 0 :
fConst = RandomFloat ( - 1e-30 , 1e+30 ) ; break ;
case 1 :
fConst = RandomFloat ( - 1e-10 , 1e+10 ) ; break ;
case 2 :
fConst = RandomFloat ( - 1e-5 , 1e+5 ) ; break ;
default :
fConst = RandomFloat ( - 1 , 1 ) ; break ;
}
char szTemp [ 1024 ] ;
// FloatToString does not rely on V_snprintf(), so it can't be affected by the current locale setting.
FloatToString ( szTemp , sizeof ( szTemp ) , fConst ) ;
static double flMaxErr1 ;
static double flMaxErr2 ;
// Compare FloatToString()'s results vs. V_snprintf()'s, also track maximum error of each.
double flCheck = atof ( szTemp ) ;
double flErr = fabs ( flCheck - fConst ) ;
flMaxErr1 = MAX ( flMaxErr1 , flErr ) ;
Assert ( EqualTol ( flCheck , fConst , .000000125 ) ) ;
char szTemp2 [ 256 ] ;
V_snprintf ( szTemp2 , sizeof ( szTemp2 ) , " %.12f " , fConst ) ;
StripExtraTrailingZeros ( szTemp2 ) ;
if ( ! strchr ( szTemp2 , ' . ' ) )
{
V_strncat ( szTemp2 , " .0 " , sizeof ( szTemp2 ) ) ;
}
double flCheck2 = atof ( szTemp2 ) ;
double flErr2 = fabs ( flCheck2 - fConst ) ;
flMaxErr2 = MAX ( flMaxErr2 , flErr2 ) ;
Assert ( EqualTol ( flCheck2 , fConst , .000000125 ) ) ;
if ( flMaxErr1 > flMaxErr2 )
{
GLMDebugPrintf ( " ! \n " ) ;
}
}
}
# endif
void D3DToGL : : Handle_DEFIB ( uint32 instruction )
{
Assert ( ( instruction = = D3DSIO_DEFI ) | | ( instruction = = D3DSIO_DEFB ) ) ;
// which register is being defined
uint32 dwToken = GetNextToken ( ) ;
uint32 nRegNum = dwToken & D3DSP_REGNUM_MASK ;
uint32 regType = GetRegTypeFromToken ( dwToken ) ;
if ( regType = = D3DSPR_CONSTINT )
{
m_dwDefConstIntUsageMask | = ( 1 < < nRegNum ) ;
uint x = GetNextToken ( ) ;
uint y = GetNextToken ( ) ;
uint z = GetNextToken ( ) ;
uint w = GetNextToken ( ) ;
NOTE_UNUSED ( y ) ; NOTE_UNUSED ( z ) ; NOTE_UNUSED ( w ) ;
Assert ( nRegNum < 32 ) ;
if ( nRegNum < 32 )
{
m_dwDefConstIntIterCount [ nRegNum ] = x ;
}
}
else
{
TranslationError ( ) ;
}
}
void D3DToGL : : Handle_DEF ( )
{
//TestFloatConversion();
//
// JasonM TODO: catch D3D's sincos-specific D3DSINCOSCONST1 and D3DSINCOSCONST2 constants and filter them out here
//
// Which register is being defined
uint32 dwToken = GetNextToken ( ) ;
// Note that this constant was explicitly defined
m_bConstantRegisterDefined [ dwToken & D3DSP_REGNUM_MASK ] = true ;
CUtlString sParamName = GetParameterString ( dwToken , DST_REGISTER , false , NULL ) ;
PrintIndentation ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) ) ;
PrintToBuf ( * m_pBufParamCode , " vec4 %s = vec4( " , sParamName . String ( ) ) ;
// Run through the 4 floats
for ( int i = 0 ; i < 4 ; i + + )
{
float fConst = uint32ToFloat ( GetNextToken ( ) ) ;
char szTemp [ 1024 ] ;
FloatToString ( szTemp , sizeof ( szTemp ) , fConst ) ;
#if 0
static double flMaxErr1 ;
static double flMaxErr2 ;
// Compare FloatToString()'s results vs. V_snprintf()'s, also track maximum error of each.
double flCheck = atof ( szTemp ) ;
double flErr = fabs ( flCheck - fConst ) ;
flMaxErr1 = MAX ( flMaxErr1 , flErr ) ;
Assert ( EqualTol ( flCheck , fConst , .000000125 ) ) ;
char szTemp2 [ 256 ] ;
V_snprintf ( szTemp2 , sizeof ( szTemp2 ) , " %.12f " , fConst ) ;
StripExtraTrailingZeros ( szTemp2 ) ;
if ( ! strchr ( szTemp2 , ' . ' ) )
{
V_strncat ( szTemp2 , " .0 " , sizeof ( szTemp2 ) ) ;
}
double flCheck2 = atof ( szTemp2 ) ;
double flErr2 = fabs ( flCheck2 - fConst ) ;
flMaxErr2 = MAX ( flMaxErr2 , flErr2 ) ;
Assert ( EqualTol ( flCheck2 , fConst , .000000125 ) ) ;
if ( flMaxErr1 > flMaxErr2 )
{
GLMDebugPrintf ( " ! \n " ) ;
}
# endif
PrintToBuf ( * m_pBufParamCode , i ! = 3 ? " %s, " : " %s " , szTemp ) ; // end with comma-space
}
PrintToBuf ( * m_pBufParamCode , " ); \n " ) ;
}
void D3DToGL : : Handle_MAD ( uint32 nInstruction )
{
uint32 nDestToken = GetNextToken ( ) ;
CUtlString sParam1 = GetParameterString ( nDestToken , DST_REGISTER , false , NULL ) ;
int nARLComp0 = ARL_DEST_NONE ;
CUtlString sParam2 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp0 ) ;
int nARLComp1 = ARL_DEST_NONE ;
CUtlString sParam3 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp1 ) ;
int nARLComp2 = ARL_DEST_NONE ;
CUtlString sParam4 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp2 ) ;
// This optionally inserts a move from our dummy address register to the .x component of the real one
InsertMoveFromAddressRegister ( m_pBufALUCode , nARLComp0 , nARLComp1 , nARLComp2 ) ;
sParam2 = FixGLSLSwizzle ( sParam1 , sParam2 ) ;
sParam3 = FixGLSLSwizzle ( sParam1 , sParam3 ) ;
sParam4 = FixGLSLSwizzle ( sParam1 , sParam4 ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s * %s + %s; \n " , sParam1 . String ( ) , sParam2 . String ( ) , sParam3 . String ( ) , sParam4 . String ( ) ) ;
// If the _SAT instruction modifier is used, then do a saturate here.
if ( nDestToken & D3DSPDM_SATURATE )
{
int nComponents = GetNumSwizzleComponents ( sParam1 . String ( ) ) ;
if ( nComponents = = 0 )
nComponents = 4 ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = clamp( %s, %s, %s ); \n " , sParam1 . String ( ) , sParam1 . String ( ) , g_szVecZeros [ nComponents ] , g_szVecOnes [ nComponents ] ) ;
}
}
void D3DToGL : : Handle_DP2ADD ( )
{
char pDestReg [ 64 ] , pSrc0Reg [ 64 ] , pSrc1Reg [ 64 ] , pSrc2Reg [ 64 ] ;
uint32 nDestToken = GetNextToken ( ) ;
PrintParameterToString ( nDestToken , DST_REGISTER , pDestReg , sizeof ( pDestReg ) , false , NULL ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc0Reg , sizeof ( pSrc0Reg ) , false , NULL ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc1Reg , sizeof ( pSrc1Reg ) , false , NULL ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc2Reg , sizeof ( pSrc2Reg ) , false , NULL ) ;
// We should only be assigning to a single component of the dest.
Assert ( GetNumSwizzleComponents ( pDestReg ) = = 1 ) ;
Assert ( GetNumSwizzleComponents ( pSrc2Reg ) = = 1 ) ;
// This is a 2D dot product, so we only want two entries from the middle components.
CUtlString sArg0 = EnsureNumSwizzleComponents ( pSrc0Reg , 2 ) ;
CUtlString sArg1 = EnsureNumSwizzleComponents ( pSrc1Reg , 2 ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = dot( %s, %s ) + %s; \n " , pDestReg , sArg0 . String ( ) , sArg1 . String ( ) , pSrc2Reg ) ;
// If the _SAT instruction modifier is used, then do a saturate here.
if ( nDestToken & D3DSPDM_SATURATE )
{
int nComponents = GetNumSwizzleComponents ( pDestReg ) ;
if ( nComponents = = 0 )
nComponents = 4 ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = clamp( %s, %s, %s ); \n " , pDestReg , pDestReg , g_szVecZeros [ nComponents ] , g_szVecOnes [ nComponents ] ) ;
}
}
void D3DToGL : : Handle_SINCOS ( )
{
char pDestReg [ 64 ] , pSrc0Reg [ 64 ] ;
PrintParameterToString ( GetNextToken ( ) , DST_REGISTER , pDestReg , sizeof ( pDestReg ) , false , NULL ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc0Reg , sizeof ( pSrc0Reg ) , true , NULL ) ;
m_bNeedsSinCosDeclarations = true ;
CUtlString sDest ( pDestReg ) ;
CUtlString sArg0 = EnsureNumSwizzleComponents ( pSrc0Reg , 1 ) ; // Ensure input is scalar
CUtlString sResult ( " vSinCosTmp.xy " ) ; // Always going to populate this
sResult = FixGLSLSwizzle ( sDest , sResult ) ; // Make sure we match the desired output reg
PrintToBufWithIndents ( * m_pBufALUCode , " vSinCosTmp.z = %s * %s; \n " , sArg0 . String ( ) , sArg0 . String ( ) ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " vSinCosTmp.xy = vSinCosTmp.zz * scA.xy + scA.wz; \n " ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " vSinCosTmp.xy = vSinCosTmp.xy * vSinCosTmp.zz + scB.xy; \n " ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " vSinCosTmp.xy = vSinCosTmp.xy * vSinCosTmp.zz + scB.wz; \n " ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " vSinCosTmp.x = vSinCosTmp.x * %s; \n " , sArg0 . String ( ) ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " vSinCosTmp.xy = vSinCosTmp.xy * vSinCosTmp.xx; \n " ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " vSinCosTmp.xy = vSinCosTmp.xy + vSinCosTmp.xy; \n " ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " vSinCosTmp.x = -vSinCosTmp.x + scB.z; \n " ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s; \n " , sDest . String ( ) , sResult . String ( ) ) ;
if ( m_dwMajorVersion < 3 )
{
// Eat two more tokens since D3D defines Taylor series constants that we won't need
// Only valid for pixel and vertex shader version earlier than 3_0
// (http://msdn.microsoft.com/en-us/library/windows/hardware/ff569710(v=vs.85).aspx)
SkipTokens ( 2 ) ;
}
}
void D3DToGL : : Handle_LRP ( uint32 nInstruction )
{
uint32 nDestToken = GetNextToken ( ) ;
CUtlString sDest = GetParameterString ( nDestToken , DST_REGISTER , false , NULL ) ;
int nARLComp0 = ARL_DEST_NONE ;
CUtlString sParam0 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp0 ) ;
int nARLComp1 = ARL_DEST_NONE ;
CUtlString sParam1 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp1 ) ;
int nARLComp2 = ARL_DEST_NONE ;
CUtlString sParam2 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp2 ) ;
// This optionally inserts a move from our dummy address register to the .x component of the real one
InsertMoveFromAddressRegister ( m_pBufALUCode , nARLComp0 , nARLComp1 , nARLComp2 ) ;
sParam0 = FixGLSLSwizzle ( sDest , sParam0 ) ;
sParam1 = FixGLSLSwizzle ( sDest , sParam1 ) ;
sParam2 = FixGLSLSwizzle ( sDest , sParam2 ) ;
// dest = src0 * (src1 - src2) + src2;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s * ( %s - %s ) + %s; \n " , sDest . String ( ) , sParam0 . String ( ) , sParam1 . String ( ) , sParam2 . String ( ) , sParam2 . String ( ) ) ;
// If the _SAT instruction modifier is used, then do a saturate here.
if ( nDestToken & D3DSPDM_SATURATE )
{
int nComponents = GetNumSwizzleComponents ( sDest . String ( ) ) ;
if ( nComponents = = 0 )
nComponents = 4 ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = clamp( %s, %s, %s ); \n " , sDest . String ( ) , sDest . String ( ) , g_szVecZeros [ nComponents ] , g_szVecOnes [ nComponents ] ) ;
}
}
void D3DToGL : : Handle_TEX ( uint32 dwToken , bool bIsTexLDL )
{
char pDestReg [ 64 ] , pSrc0Reg [ 64 ] , pSrc1Reg [ 64 ] ;
PrintParameterToString ( GetNextToken ( ) , DST_REGISTER , pDestReg , sizeof ( pDestReg ) , false , NULL ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc0Reg , sizeof ( pSrc0Reg ) , false , NULL ) ;
DWORD dwSrc1Token = GetNextToken ( ) ;
PrintParameterToString ( dwSrc1Token , SRC_REGISTER , pSrc1Reg , sizeof ( pSrc1Reg ) , false , NULL ) ;
Assert ( ( dwSrc1Token & D3DSP_REGNUM_MASK ) < ARRAYSIZE ( m_dwSamplerTypes ) ) ;
uint32 nSamplerType = m_dwSamplerTypes [ dwSrc1Token & D3DSP_REGNUM_MASK ] ;
if ( nSamplerType = = SAMPLER_TYPE_2D )
{
const bool bIsShadowSampler = ( ( 1 < < ( ( int ) ( dwSrc1Token & D3DSP_REGNUM_MASK ) ) ) & m_nShadowDepthSamplerMask ) ! = 0 ;
if ( bIsTexLDL )
{
CUtlString sCoordVar = EnsureNumSwizzleComponents ( pSrc0Reg , bIsShadowSampler ? 3 : 2 ) ;
// Strip out the W component of the pSrc0Reg and pass that as the LOD to texture2DLod.
char szLOD [ 128 ] , szExtra [ 8 ] ;
GetParamNameWithoutSwizzle ( pSrc0Reg , szLOD , sizeof ( szLOD ) ) ;
V_snprintf ( szExtra , sizeof ( szExtra ) , " .%c " , GetSwizzleComponent ( pSrc0Reg , 3 ) ) ;
V_strncat ( szLOD , szExtra , sizeof ( szLOD ) ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s( %s, %s, %s ); \n " , pDestReg , bIsShadowSampler ? " shadow2DLod " : " textureLod " , pSrc1Reg , sCoordVar . String ( ) , szLOD ) ;
}
else if ( bIsShadowSampler )
{
// .z is meant to contain the object depth, while .xy contains the 2D tex coords
CUtlString sCoordVar3D = EnsureNumSwizzleComponents ( pSrc0Reg , 3 ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = shadow2D( %s, %s ); \n " , pDestReg , pSrc1Reg , sCoordVar3D . String ( ) ) ;
Assert ( m_dwSamplerTypes [ dwSrc1Token & D3DSP_REGNUM_MASK ] = = SAMPLER_TYPE_2D ) ;
}
else if ( ( OpcodeSpecificData ( dwToken ) < < D3DSP_OPCODESPECIFICCONTROL_SHIFT ) = = D3DSI_TEXLD_PROJECT )
{
// This projective case is after the shadow case intentionally, due to the way that "projective"
// loads are overloaded in our D3D shaders for shadow lookups.
//
// We use the vec4 variant of texture2DProj() intentionally here, since it lines up well with Direct3D.
CUtlString s4DProjCoords = EnsureNumSwizzleComponents ( pSrc0Reg , 4 ) ; // Ensure vec4 variant
PrintToBufWithIndents ( * m_pBufALUCode , " %s = textureProj( %s, %s ); \n " , pDestReg , pSrc1Reg , s4DProjCoords . String ( ) ) ;
}
else
{
CUtlString sCoordVar = EnsureNumSwizzleComponents ( pSrc0Reg , bIsShadowSampler ? 3 : 2 ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = texture( %s, %s ); \n " , pDestReg , pSrc1Reg , sCoordVar . String ( ) ) ;
}
}
else if ( nSamplerType = = SAMPLER_TYPE_3D )
{
if ( bIsTexLDL )
{
TranslationError ( ) ;
}
CUtlString sCoordVar = EnsureNumSwizzleComponents ( pSrc0Reg , 3 ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = texture( %s, %s ); \n " , pDestReg , pSrc1Reg , sCoordVar . String ( ) ) ;
}
else if ( nSamplerType = = SAMPLER_TYPE_CUBE )
{
if ( bIsTexLDL )
{
TranslationError ( ) ;
}
CUtlString sCoordVar = EnsureNumSwizzleComponents ( pSrc0Reg , 3 ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = texture( %s, %s ); \n " , pDestReg , pSrc1Reg , sCoordVar . String ( ) ) ;
}
else
{
Error ( " TEX instruction: unsupported sampler type used " ) ;
}
}
void D3DToGL : : StrcatToHeaderCode ( const char * pBuf )
{
strcat_s ( ( char * ) m_pBufHeaderCode - > Base ( ) , m_pBufHeaderCode - > Size ( ) , pBuf ) ;
}
void D3DToGL : : StrcatToALUCode ( const char * pBuf )
{
PrintIndentation ( ( char * ) m_pBufALUCode - > Base ( ) , m_pBufALUCode - > Size ( ) ) ;
strcat_s ( ( char * ) m_pBufALUCode - > Base ( ) , m_pBufALUCode - > Size ( ) , pBuf ) ;
}
void D3DToGL : : StrcatToParamCode ( const char * pBuf )
{
strcat_s ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) , pBuf ) ;
}
void D3DToGL : : StrcatToAttribCode ( const char * pBuf )
{
strcat_s ( ( char * ) m_pBufAttribCode - > Base ( ) , m_pBufAttribCode - > Size ( ) , pBuf ) ;
}
void D3DToGL : : Handle_TexLDD ( uint32 nInstruction )
{
TranslationError ( ) ; // Not supported yet, but can be if we need it.
}
void D3DToGL : : Handle_TexCoord ( )
{
TranslationError ( ) ;
// If ps_1_4, this is texcrd
if ( ( m_dwMajorVersion = = 1 ) & & ( m_dwMinorVersion = = 4 ) & & ( ! m_bVertexShader ) )
{
StrcatToALUCode ( " texcrd " ) ;
}
else // else it's texcoord
{
TranslationError ( ) ;
StrcatToALUCode ( " texcoord " ) ;
}
char buff [ 256 ] ;
PrintParameterToString ( GetNextToken ( ) , DST_REGISTER , buff , sizeof ( buff ) , false , NULL ) ;
StrcatToALUCode ( buff ) ;
// If ps_1_4, texcrd also has a source parameter
if ( ( m_dwMajorVersion = = 1 ) & & ( m_dwMinorVersion = = 4 ) & & ( ! m_bVertexShader ) )
{
StrcatToALUCode ( " , " ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , buff , sizeof ( buff ) , false , NULL ) ;
StrcatToALUCode ( buff ) ;
}
StrcatToALUCode ( " ; \n " ) ;
}
void D3DToGL : : Handle_BREAKC ( uint32 dwToken )
{
uint nComparison = ( dwToken & D3DSHADER_COMPARISON_MASK ) > > D3DSHADER_COMPARISON_SHIFT ;
const char * pComparison = " ? " ;
switch ( nComparison )
{
case D3DSPC_GT : pComparison = " > " ; break ;
case D3DSPC_EQ : pComparison = " == " ; break ;
case D3DSPC_GE : pComparison = " >= " ; break ;
case D3DSPC_LT : pComparison = " < " ; break ;
case D3DSPC_NE : pComparison = " != " ; break ;
case D3DSPC_LE : pComparison = " <= " ; break ;
default :
TranslationError ( ) ;
}
char src0 [ 256 ] ;
uint32 src0Token = GetNextToken ( ) ;
PrintParameterToString ( src0Token , SRC_REGISTER , src0 , sizeof ( src0 ) , false , NULL ) ;
char src1 [ 256 ] ;
uint32 src1Token = GetNextToken ( ) ;
PrintParameterToString ( src1Token , SRC_REGISTER , src1 , sizeof ( src1 ) , false , NULL ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " if (%s %s %s) break; \n " , src0 , pComparison , src1 ) ;
}
void D3DToGL : : HandleBinaryOp_GLSL ( uint32 nInstruction )
{
uint32 nDestToken = GetNextToken ( ) ;
CUtlString sParam1 = GetParameterString ( nDestToken , DST_REGISTER , false , NULL ) ;
int nARLComp0 = ARL_DEST_NONE ;
CUtlString sParam2 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp0 ) ;
int nARLComp1 = ARL_DEST_NONE ;
CUtlString sParam3 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp1 ) ;
// This optionally inserts a move from our dummy address register to the .x component of the real one
InsertMoveFromAddressRegister ( m_pBufALUCode , nARLComp0 , nARLComp1 ) ;
// Since DP3 and DP4 have a scalar as the dest and vectors as the src, don't screw with the swizzle specifications.
if ( nInstruction = = D3DSIO_DP3 )
{
sParam2 = EnsureNumSwizzleComponents ( sParam2 , 3 ) ;
sParam3 = EnsureNumSwizzleComponents ( sParam3 , 3 ) ;
}
else if ( nInstruction = = D3DSIO_DP4 )
{
sParam2 = EnsureNumSwizzleComponents ( sParam2 , 4 ) ;
sParam3 = EnsureNumSwizzleComponents ( sParam3 , 4 ) ;
}
else if ( nInstruction = = D3DSIO_DST )
{
m_bUsesDSTInstruction = true ;
sParam2 = EnsureNumSwizzleComponents ( sParam2 , 4 ) ;
sParam3 = EnsureNumSwizzleComponents ( sParam3 , 4 ) ;
}
else
{
sParam2 = FixGLSLSwizzle ( sParam1 , sParam2 ) ;
sParam3 = FixGLSLSwizzle ( sParam1 , sParam3 ) ;
}
char buff [ 256 ] ;
if ( nInstruction = = D3DSIO_ADD | | nInstruction = = D3DSIO_SUB | | nInstruction = = D3DSIO_MUL )
{
// These all look like x = y op z
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s %s %s; \n " , sParam1 . String ( ) , sParam2 . String ( ) , GetGLSLOperatorString ( nInstruction ) , sParam3 . String ( ) ) ;
}
else
{
int nDestComponents = GetNumSwizzleComponents ( sParam1 . String ( ) ) ;
int nSrcComponents = GetNumSwizzleComponents ( sParam2 . String ( ) ) ;
// All remaining instructions can use GLSL intrinsics like dot() and cross().
bool bDoubleClose = OpenIntrinsic ( nInstruction , buff , sizeof ( buff ) , nDestComponents , nSrcComponents ) ;
if ( ( nSrcComponents = = 1 ) & & ( nInstruction = = D3DSIO_SGE ) )
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s%s >= %s ); \n " , sParam1 . String ( ) , buff , sParam2 . String ( ) , sParam3 . String ( ) ) ;
}
else if ( ( nSrcComponents = = 1 ) & & ( nInstruction = = D3DSIO_SLT ) )
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s%s < %s ); \n " , sParam1 . String ( ) , buff , sParam2 . String ( ) , sParam3 . String ( ) ) ;
}
else
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s%s, %s %s; \n " , sParam1 . String ( ) , buff , sParam2 . String ( ) , sParam3 . String ( ) , bDoubleClose ? " ) ) " : " ) " ) ;
}
}
// If the _SAT instruction modifier is used, then do a saturate here.
if ( nDestToken & D3DSPDM_SATURATE )
{
int nComponents = GetNumSwizzleComponents ( sParam1 . String ( ) ) ;
if ( nComponents = = 0 )
nComponents = 4 ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = clamp( %s, %s, %s ); \n " , sParam1 . String ( ) , sParam1 . String ( ) , g_szVecZeros [ nComponents ] , g_szVecOnes [ nComponents ] ) ;
}
}
void D3DToGL : : HandleBinaryOp_ASM ( uint32 nInstruction )
{
CUtlString sParam1 = GetParameterString ( GetNextToken ( ) , DST_REGISTER , false , NULL ) ;
int nARLComp0 = ARL_DEST_NONE ;
CUtlString sParam2 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp0 ) ;
int nARLComp1 = ARL_DEST_NONE ;
CUtlString sParam3 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , & nARLComp1 ) ;
// This optionally inserts a move from our dummy address register to the .x component of the real one
InsertMoveFromAddressRegister ( m_pBufALUCode , nARLComp0 , nARLComp1 ) ;
char buff [ 256 ] ;
PrintOpcode ( nInstruction , buff , sizeof ( buff ) ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s%s, %s, %s; \n " , buff , sParam1 . String ( ) , sParam2 . String ( ) , sParam3 . String ( ) ) ;
}
void D3DToGL : : WriteGLSLCmp ( const char * pDestReg , const char * pSrc0Reg , const char * pSrc1Reg , const char * pSrc2Reg )
{
int nWriteMaskEntries = GetNumWriteMaskEntries ( pDestReg ) ;
for ( int i = 0 ; i < nWriteMaskEntries ; i + + )
{
char params [ 4 ] [ 256 ] ;
WriteParamWithSingleMaskEntry ( pDestReg , i , params [ 0 ] , sizeof ( params [ 0 ] ) ) ;
WriteParamWithSingleMaskEntry ( pSrc0Reg , i , params [ 1 ] , sizeof ( params [ 1 ] ) ) ;
WriteParamWithSingleMaskEntry ( pSrc1Reg , i , params [ 2 ] , sizeof ( params [ 2 ] ) ) ;
WriteParamWithSingleMaskEntry ( pSrc2Reg , i , params [ 3 ] , sizeof ( params [ 3 ] ) ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = ( %s >= 0.0 ) ? %s : %s; \n " , params [ 0 ] , params [ 1 ] , params [ 2 ] , params [ 3 ] ) ;
}
}
void D3DToGL : : Handle_CMP ( )
{
// In Direct3D, result = (src0 >= 0.0) ? src1 : src2
// In OpenGL, result = (src0 < 0.0) ? src1 : src2
//
// As a result, arguments are effectively in a different order than Direct3D! !#$&*!%#$&
char pDestReg [ 64 ] , pSrc0Reg [ 64 ] , pSrc1Reg [ 64 ] , pSrc2Reg [ 64 ] ;
uint32 nDestToken = GetNextToken ( ) ;
PrintParameterToString ( nDestToken , DST_REGISTER , pDestReg , sizeof ( pDestReg ) , false , NULL ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc0Reg , sizeof ( pSrc0Reg ) , false , NULL ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc1Reg , sizeof ( pSrc1Reg ) , false , NULL ) ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc2Reg , sizeof ( pSrc2Reg ) , false , NULL ) ;
// These are a tricky case.. we have to expand it out into multiple statements.
char szDestBase [ 256 ] ;
GetParamNameWithoutSwizzle ( pDestReg , szDestBase , sizeof ( szDestBase ) ) ;
V_strncpy ( pSrc0Reg , FixGLSLSwizzle ( pDestReg , pSrc0Reg ) , sizeof ( pSrc0Reg ) ) ;
V_strncpy ( pSrc1Reg , FixGLSLSwizzle ( pDestReg , pSrc1Reg ) , sizeof ( pSrc1Reg ) ) ;
V_strncpy ( pSrc2Reg , FixGLSLSwizzle ( pDestReg , pSrc2Reg ) , sizeof ( pSrc2Reg ) ) ;
// This isn't reliable!
//if ( DoParamNamesMatch( pDestReg, pSrc0Reg ) && GetNumSwizzleComponents( pDestReg ) > 1 )
if ( 1 )
{
// So the dest register is the same as the comparand. We're in danger of screwing up our results.
//
// For example, this code:
// CMP r0.xy, r0.xx, r1, r2
// would generate this:
// r0.x = (r0.x >= 0) ? r1.x : r2.x;
// r0.y = (r0.x >= 0) ? r1.x : r2.x;
//
// But the first lines changes r0.x and thus screws the atomicity of the CMP instruction for the second line.
// So we assign r0 to a temporary first and then write to the temporary.
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s; \n " , g_pAtomicTempVarName , szDestBase ) ;
char szTempVar [ 256 ] ;
ReplaceParamName ( pDestReg , g_pAtomicTempVarName , szTempVar , sizeof ( szTempVar ) ) ;
WriteGLSLCmp ( szTempVar , pSrc0Reg , pSrc1Reg , pSrc2Reg ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s; \n " , szDestBase , g_pAtomicTempVarName ) ;
m_bUsedAtomicTempVar = true ;
}
else
{
// Just write out the simple expanded version of the CMP. No need to use atomic_temp_var.
WriteGLSLCmp ( pDestReg , pSrc0Reg , pSrc1Reg , pSrc2Reg ) ;
}
// If the _SAT instruction modifier is used, then do a saturate here.
if ( nDestToken & D3DSPDM_SATURATE )
{
int nComponents = GetNumSwizzleComponents ( pDestReg ) ;
if ( nComponents = = 0 )
nComponents = 4 ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = clamp( %s, %s, %s ); \n " , pDestReg , pDestReg , g_szVecZeros [ nComponents ] , g_szVecOnes [ nComponents ] ) ;
}
}
void D3DToGL : : Handle_NRM ( )
{
char pDestReg [ 64 ] ;
char pSrc0Reg [ 64 ] ;
PrintParameterToString ( GetNextToken ( ) , DST_REGISTER , pDestReg , sizeof ( pDestReg ) , false , NULL ) ;
int nARLSrcComp = ARL_DEST_NONE ;
PrintParameterToString ( GetNextToken ( ) , SRC_REGISTER , pSrc0Reg , sizeof ( pSrc0Reg ) , false , & nARLSrcComp ) ;
if ( nARLSrcComp ! = - 1 )
{
InsertMoveFromAddressRegister ( m_pBufALUCode , nARLSrcComp , - 1 , - 1 ) ;
}
CUtlString sSrc = EnsureNumSwizzleComponents ( pSrc0Reg , 3 ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = normalize( %s ); \n " , pDestReg , sSrc . String ( ) ) ;
}
void D3DToGL : : Handle_UnaryOp ( uint32 nInstruction )
{
uint32 nDestToken = GetNextToken ( ) ;
CUtlString sParam1 = GetParameterString ( nDestToken , DST_REGISTER , false , NULL ) ;
CUtlString sParam2 = GetParameterString ( GetNextToken ( ) , SRC_REGISTER , false , NULL ) ;
sParam2 = FixGLSLSwizzle ( sParam1 , sParam2 ) ;
if ( nInstruction = = D3DSIO_MOV )
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s; \n " , sParam1 . String ( ) , sParam2 . String ( ) ) ;
}
else if ( nInstruction = = D3DSIO_RSQ )
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = inversesqrt( %s ); \n " , sParam1 . String ( ) , sParam2 . String ( ) ) ;
}
else if ( nInstruction = = D3DSIO_RCP )
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = 1.0 / %s; \n " , sParam1 . String ( ) , sParam2 . String ( ) ) ;
}
else if ( nInstruction = = D3DSIO_EXP )
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = exp2( %s ); \n " , sParam1 . String ( ) , sParam2 . String ( ) ) ;
}
else if ( nInstruction = = D3DSIO_FRC )
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = fract( %s ); \n " , sParam1 . String ( ) , sParam2 . String ( ) ) ;
}
else if ( nInstruction = = D3DSIO_LOG ) // d3d 'log' is log base 2
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = log2( %s ); \n " , sParam1 . String ( ) , sParam2 . String ( ) ) ;
}
else if ( nInstruction = = D3DSIO_ABS ) // rbarris did this one, Jason please check
{
PrintToBufWithIndents ( * m_pBufALUCode , " %s = abs( %s ); \n " , sParam1 . String ( ) , sParam2 . String ( ) ) ;
}
else if ( nInstruction = = D3DSIO_MOVA )
{
m_bDeclareAddressReg = true ;
PrintToBufWithIndents ( * m_pBufALUCode , " %s = %s; \n " , sParam1 . String ( ) , sParam2 . String ( ) ) ;
if ( ! m_bGenerateBoneUniformBuffer )
{
m_nHighestRegister = DXABSTRACT_VS_PARAM_SLOTS - 1 ;
}
}
else
{
Error ( " Unsupported instruction " ) ;
}
// If the _SAT instruction modifier is used, then do a saturate here.
if ( nDestToken & D3DSPDM_SATURATE )
{
int nComponents = GetNumSwizzleComponents ( sParam1 . String ( ) ) ;
if ( nComponents = = 0 )
{
nComponents = 4 ;
}
PrintToBufWithIndents ( * m_pBufALUCode , " %s = clamp( %s, %s, %s ); \n " , sParam1 . String ( ) , sParam1 . String ( ) , g_szVecZeros [ nComponents ] , g_szVecOnes [ nComponents ] ) ;
}
}
void D3DToGL : : WriteGLSLSamplerDefinitions ( )
{
int nSamplersWritten = 0 ;
bool m_bSampler3d = false ;
for ( int i = 0 ; i < ARRAYSIZE ( m_dwSamplerTypes ) ; i + + )
{
if ( m_dwSamplerTypes [ i ] = = SAMPLER_TYPE_2D )
{
if ( ( ( 1 < < i ) & m_nShadowDepthSamplerMask ) ! = 0 )
{
PrintToBuf ( * m_pBufHeaderCode , " uniform sampler2D sampler%d; \n " , i ) ;
}
else
{
PrintToBuf ( * m_pBufHeaderCode , " uniform sampler2D sampler%d; \n " , i ) ;
}
+ + nSamplersWritten ;
}
else if ( m_dwSamplerTypes [ i ] = = SAMPLER_TYPE_3D )
{
if ( ! m_bSampler3d )
{
StrcatToHeaderCode ( " precision mediump sampler3D; \n " ) ;
m_bSampler3d = true ;
}
PrintToBuf ( * m_pBufHeaderCode , " uniform sampler3D sampler%d; \n " , i ) ;
+ + nSamplersWritten ;
}
else if ( m_dwSamplerTypes [ i ] = = SAMPLER_TYPE_CUBE )
{
PrintToBuf ( * m_pBufHeaderCode , " uniform samplerCube sampler%d; \n " , i ) ;
+ + nSamplersWritten ;
}
else if ( m_dwSamplerTypes [ i ] ! = SAMPLER_TYPE_UNUSED )
{
Error ( " Unknown sampler type. " ) ;
}
}
if ( nSamplersWritten > 0 )
PrintToBuf ( * m_pBufHeaderCode , " \n \n " ) ;
}
void D3DToGL : : WriteGLSLOutputVariableAssignments ( )
{
if ( m_bVertexShader )
{
// Map output "oN" registers back to GLSL output variables.
if ( m_bAddHexCodeComments )
{
PrintToBuf ( * m_pBufAttribCode , " \n // Now we're storing the oN variables from the output dcl_ statements back into their GLSL equivalents. \n " ) ;
}
for ( int i = 0 ; i < ARRAYSIZE ( m_DeclaredOutputs ) ; i + + )
{
if ( m_DeclaredOutputs [ i ] = = UNDECLARED_OUTPUT )
continue ;
if ( ( m_dwTexCoordOutMask & ( 1 < < i ) ) = = 0 )
continue ;
uint32 dwToken = m_DeclaredOutputs [ i ] ;
uint32 dwUsage = ( dwToken & D3DSP_DCL_USAGE_MASK ) ;
uint32 dwUsageIndex = ( dwToken & D3DSP_DCL_USAGEINDEX_MASK ) > > D3DSP_DCL_USAGEINDEX_SHIFT ;
if ( ( dwUsage = = D3DDECLUSAGE_FOG ) | | ( dwUsage = = D3DDECLUSAGE_PSIZE ) )
{
TranslationError ( ) ; // Not supported yet, but can be if we need it.
}
if ( dwUsage = = D3DDECLUSAGE_COLOR )
{
if ( ! m_bFrontColor )
{
StrcatToHeaderCode ( " varying lowp vec4 _gl_FrontColor; \n " ) ;
m_bFrontColor = true ;
}
PrintToBufWithIndents ( * m_pBufALUCode , " %s = oTempT%d; \n " , dwUsageIndex ? " gl_FrontSecondaryColor " : " _gl_FrontColor " , i ) ;
}
else if ( dwUsage = = D3DDECLUSAGE_TEXCOORD )
{
char buf [ 256 ] ;
if ( m_nCentroidMask & ( 0x00000001 < < dwUsageIndex ) )
{
V_snprintf ( buf , sizeof ( buf ) , " centroid out vec4 oT%d; \n " , dwUsageIndex ) ; // centroid varying
}
else
{
V_snprintf ( buf , sizeof ( buf ) , " out vec4 oT%d; \n " , dwUsageIndex ) ;
}
StrcatToHeaderCode ( buf ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " oT%d = oTempT%d; \n " , dwUsageIndex , i ) ;
}
}
}
}
void D3DToGL : : WriteGLSLInputVariableAssignments ( )
{
if ( m_bVertexShader )
return ;
for ( int i = 0 ; i < ARRAYSIZE ( m_DeclaredInputs ) ; i + + )
{
if ( m_DeclaredInputs [ i ] = = UNDECLARED_INPUT )
continue ;
uint32 dwToken = m_DeclaredInputs [ i ] ;
uint32 dwUsage = ( dwToken & D3DSP_DCL_USAGE_MASK ) ;
uint32 dwUsageIndex = ( dwToken & D3DSP_DCL_USAGEINDEX_MASK ) > > D3DSP_DCL_USAGEINDEX_SHIFT ;
if ( dwUsage = = D3DDECLUSAGE_COLOR )
{
PrintToBufWithIndents ( * m_pBufAttribCode , " vec4 oTempT%d = %s; \n " , i , dwUsageIndex ? " _gl_FrontSecondaryColor " : " _gl_FrontColor " ) ;
}
else if ( dwUsage = = D3DDECLUSAGE_TEXCOORD )
{
PrintToBufWithIndents ( * m_pBufAttribCode , " vec4 oTempT%d = oT%d; \n " , i , dwUsageIndex ) ;
}
}
}
void D3DToGL : : Handle_DeclarativeNonDclOp ( uint32 nInstruction )
{
char buff [ 128 ] ;
uint32 dwToken = GetNextToken ( ) ;
PrintParameterToString ( dwToken , DST_REGISTER , buff , sizeof ( buff ) , false , NULL ) ;
if ( nInstruction = = D3DSIO_TEXKILL )
{
// TEXKILL is supposed to discard the pixel if any of the src register's X, Y, or Z components are less than zero.
// We have to translate it to something like:
// if ( r0.x < 0.0 || r0.y < 0.0 )
// discard;
char c [ 3 ] ;
c [ 0 ] = GetSwizzleComponent ( buff , 0 ) ;
c [ 1 ] = GetSwizzleComponent ( buff , 1 ) ;
c [ 2 ] = GetSwizzleComponent ( buff , 2 ) ;
// Get the unique components.
char cUnique [ 3 ] ;
cUnique [ 0 ] = c [ 0 ] ;
int nUnique = 1 ;
if ( c [ 1 ] ! = c [ 0 ] )
cUnique [ nUnique + + ] = c [ 1 ] ;
if ( c [ 2 ] ! = c [ 1 ] & & c [ 2 ] ! = c [ 0 ] )
cUnique [ nUnique + + ] = c [ 2 ] ;
// Get the src register base name.
char szBase [ 256 ] ;
GetParamNameWithoutSwizzle ( buff , szBase , sizeof ( szBase ) ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " if ( %s.%c < 0.0 " , szBase , cUnique [ 0 ] ) ;
for ( int i = 1 ; i < nUnique ; i + + )
{
PrintToBuf ( * m_pBufALUCode , " || %s.%c < 0.0 " , szBase , cUnique [ i ] ) ;
}
PrintToBuf ( * m_pBufALUCode , " ) \n { \n \t discard; \n } \n " ) ;
}
else
{
char szOpcode [ 128 ] ;
PrintOpcode ( nInstruction , szOpcode , sizeof ( szOpcode ) ) ;
StrcatToALUCode ( szOpcode ) ;
StrcatToALUCode ( buff ) ;
StrcatToALUCode ( " ; \n " ) ;
}
}
void D3DToGL : : NoteTangentInputUsed ( )
{
if ( ! m_bTangentInputUsed )
{
m_bTangentInputUsed = true ;
// PrintToBuf( *m_pBufParamCode, "attribute vec4 %s;\n", g_pTangentAttributeName );
}
}
// These are the only ARL instructions that should appear in the instruction stream
void D3DToGL : : InsertMoveInstruction ( CUtlBuffer * pCode , int nARLComponent )
{
PrintIndentation ( ( char * ) pCode - > Base ( ) , pCode - > Size ( ) ) ;
switch ( nARLComponent )
{
case ARL_DEST_X :
strcat_s ( ( char * ) pCode - > Base ( ) , pCode - > Size ( ) , " a0 = int( va_r.x ); \n " ) ;
break ;
case ARL_DEST_Y :
strcat_s ( ( char * ) pCode - > Base ( ) , pCode - > Size ( ) , " a0 = int( va_r.y ); \n " ) ;
break ;
case ARL_DEST_Z :
strcat_s ( ( char * ) pCode - > Base ( ) , pCode - > Size ( ) , " a0 = int( va_r.z ); \n " ) ;
break ;
case ARL_DEST_W :
strcat_s ( ( char * ) pCode - > Base ( ) , pCode - > Size ( ) , " a0 = int( va_r.w ); \n " ) ;
break ;
}
}
// This optionally inserts a move from our dummy address register to the .x component of the real one
void D3DToGL : : InsertMoveFromAddressRegister ( CUtlBuffer * pCode , int nARLComp0 , int nARLComp1 , int nARLComp2 /* = ARL_DEST_NONE */ )
{
// We no longer need to do this in GLSL - we put the cast to int from the dummy address register va_r.x, va_r.y, etc. directly into the instruction
return ;
}
//------------------------------------------------------------------------------
// TranslateShader()
//
// This is the main function that the outside world sees. A pointer to the
// uint32 stream returned from the D3DX compile routine is parsed and used
// to write human-readable asm code into the character array pointed to by
// pDisassembledCode. An error code is returned.
//------------------------------------------------------------------------------
int D3DToGL : : TranslateShader ( uint32 * code , CUtlBuffer * pBufDisassembledCode , bool * bVertexShader , uint32 options , int32 nShadowDepthSamplerMask , uint32 nCentroidMask , char * debugLabel )
{
CUtlString sLine , sParamName ;
uint32 i , dwToken , nInstruction , nNumTokensToSkip ;
char buff [ 256 ] ;
// obey options
m_bUseEnvParams = ( options & D3DToGL_OptionUseEnvParams ) ! = 0 ;
m_bDoFixupZ = ( options & D3DToGL_OptionDoFixupZ ) ! = 0 ;
m_bDoFixupY = ( options & D3DToGL_OptionDoFixupY ) ! = 0 ;
m_bDoUserClipPlanes = ( options & D3DToGL_OptionDoUserClipPlanes ) ! = 0 ;
m_bFrontSecondaryColor = false ;
m_bFogFragCoord = false ;
m_bColor = false ;
m_bFrontColor = false ;
m_bSecondaryColor = false ;
m_iFragDataCount = 0 ;
m_bAddHexCodeComments = ( options & D3DToGL_AddHexComments ) ! = 0 ;
m_bPutHexCodesAfterLines = ( options & D3DToGL_PutHexCommentsAfterLines ) ! = 0 ;
m_bGeneratingDebugText = ( options & D3DToGL_GeneratingDebugText ) ! = 0 ;
m_bGenerateSRGBWriteSuffix = ( options & D3DToGL_OptionSRGBWriteSuffix ) ! = 0 ;
// m_bGenerateSRGBWriteSuffix = true;
if ( debugLabel & & ( V_strstr ( debugLabel , " vertexlit_and_unlit_generic_bump_ps " ) ) )
m_bGenerateSRGBWriteSuffix = true ;
m_NumIndentTabs = 1 ; // start code indented one tab
m_nLoopDepth = 0 ;
// debugging
m_bSpew = ( options & D3DToGL_OptionSpew ) ! = 0 ;
// These are not accessed below in a way that will cause them to glow, so
// we could overflow these and/or the buffer pointed to by pDisassembledCode
m_pBufAttribCode = new CUtlBuffer ( 100 , 10000 , CUtlBuffer : : TEXT_BUFFER ) ;
m_pBufParamCode = new CUtlBuffer ( 100 , 10000 , CUtlBuffer : : TEXT_BUFFER ) ;
m_pBufALUCode = new CUtlBuffer ( 100 , 60000 , CUtlBuffer : : TEXT_BUFFER ) ;
// Pointers to text buffers for assembling sections of the program
m_pBufHeaderCode = pBufDisassembledCode ;
char * pAttribMapStart = NULL ;
( ( char * ) m_pBufHeaderCode - > Base ( ) ) [ 0 ] = 0 ;
( ( char * ) m_pBufAttribCode - > Base ( ) ) [ 0 ] = 0 ;
( ( char * ) m_pBufParamCode - > Base ( ) ) [ 0 ] = 0 ;
( ( char * ) m_pBufALUCode - > Base ( ) ) [ 0 ] = 0 ;
for ( i = 0 ; i < MAX_SHADER_CONSTANTS ; i + + )
{
m_bConstantRegisterDefined [ i ] = false ;
}
// Track shadow sampler usage for proper declaration
m_nShadowDepthSamplerMask = nShadowDepthSamplerMask ;
m_bDeclareShadowOption = false ;
// Various flags set while parsing code to drive various declaration instructions
m_bNeedsD2AddTemp = false ;
m_bNeedsLerpTemp = false ;
m_bNeedsNRMTemp = false ;
m_bNeedsSinCosDeclarations = false ;
m_bDeclareAddressReg = false ;
m_bDeclareVSOPos = false ;
m_bDeclareVSOFog = false ;
m_dwTexCoordOutMask = 0x00000000 ;
m_nVSPositionOutput = - 1 ;
m_bOutputColorRegister [ 0 ] = false ;
m_bOutputColorRegister [ 1 ] = false ;
m_bOutputColorRegister [ 2 ] = false ;
m_bOutputColorRegister [ 3 ] = false ;
m_bOutputDepthRegister = false ;
m_bTangentInputUsed = false ;
m_bUsesDSTInstruction = false ;
m_dwTempUsageMask = 0x00000000 ;
m_dwSamplerUsageMask = 0x00000000 ;
m_dwConstIntUsageMask = 0x00000000 ;
m_dwDefConstIntUsageMask = 0x00000000 ;
memset ( m_dwDefConstIntIterCount , 0 , sizeof ( m_dwDefConstIntIterCount ) ) ;
m_dwConstBoolUsageMask = 0x00000000 ;
m_nCentroidMask = nCentroidMask ;
m_nHighestRegister = 0 ;
m_nHighestBoneRegister = - 1 ;
m_bGenerateBoneUniformBuffer = false ;
m_bUseBindlessTexturing = ( ( options & D3DToGL_OptionUseBindlessTexturing ) ! = 0 ) ;
m_bUsedAtomicTempVar = false ;
for ( int i = 0 ; i < ARRAYSIZE ( m_dwSamplerTypes ) ; i + + )
{
m_dwSamplerTypes [ i ] = SAMPLER_TYPE_UNUSED ;
}
for ( int i = 0 ; i < ARRAYSIZE ( m_DeclaredOutputs ) ; i + + )
{
m_DeclaredOutputs [ i ] = UNDECLARED_OUTPUT ;
}
for ( int i = 0 ; i < ARRAYSIZE ( m_DeclaredInputs ) ; i + + )
{
m_DeclaredInputs [ i ] = UNDECLARED_INPUT ;
}
memset ( m_dwAttribMap , 0xFF , sizeof ( m_dwAttribMap ) ) ;
m_pdwBaseToken = m_pdwNextToken = code ; // Initialize dwToken pointers
dwToken = GetNextToken ( ) ;
m_dwMajorVersion = D3DSHADER_VERSION_MAJOR ( dwToken ) ;
m_dwMinorVersion = D3DSHADER_VERSION_MINOR ( dwToken ) ;
// If pixel shader
const char * glslExtText = " \n " ; //#extension GL_ARB_shader_texture_lod : require\n";//m_bUseBindlessTexturing ? "#extension GL_NV_bindless_texture : require\n" : "";
// 7ls
// const char *glslVersionText = m_bUseBindlessTexturing ? "330 compatibility" : "120";
if ( ( dwToken & 0xFFFF0000 ) = = 0xFFFF0000 )
{
// must explicitly enable extensions if emitting GLSL
V_snprintf ( ( char * ) m_pBufHeaderCode - > Base ( ) , m_pBufHeaderCode - > Size ( ) , " #version 300 es \n precision mediump float; \n #define varying in \n \n %s " , glslExtText ) ;
m_bVertexShader = false ;
}
else // vertex shader
{
m_bGenerateSRGBWriteSuffix = false ;
V_snprintf ( ( char * ) m_pBufHeaderCode - > Base ( ) , m_pBufHeaderCode - > Size ( ) , " #version 300 es \n precision mediump float; \n #define attribute in \n #define varying out \n %s//ATTRIBMAP-xx-xx-xx-xx-xx-xx-xx-xx-xx-xx-xx-xx-xx-xx-xx-xx \n " , glslExtText ) ;
// find that first '-xx' which is where the attrib map will be written later.
pAttribMapStart = strstr ( ( char * ) m_pBufHeaderCode - > Base ( ) , " -xx " ) + 1 ;
m_bVertexShader = true ;
}
* bVertexShader = m_bVertexShader ;
m_bGenerateBoneUniformBuffer = m_bVertexShader & & ( ( options & D3DToGL_OptionGenerateBoneUniformBuffer ) ! = 0 ) ;
if ( m_bAddHexCodeComments )
{
RecordInputAndOutputPositions ( ) ;
}
if ( m_bSpew )
{
printf ( " \n ************* translating shader " ) ;
}
int opcounter = 0 ;
// Loop until we hit the end dwToken...note that D3DPS_END() == D3DVS_END() so this works for either
while ( dwToken ! = D3DPS_END ( ) )
{
if ( m_bAddHexCodeComments )
{
AddTokenHexCode ( ) ;
RecordInputAndOutputPositions ( ) ;
}
# ifdef POSIX
int tokenIndex = m_pdwNextToken - code ;
# endif
int aluCodeLength0 = V_strlen ( ( char * ) m_pBufALUCode - > Base ( ) ) ;
dwToken = GetNextToken ( ) ; // Get next dwToken in the stream
nInstruction = Opcode ( dwToken ) ; // Mask out the instruction opcode
if ( m_bSpew )
{
# ifdef POSIX
printf ( " \n ** token# %04x inst# %04d opcode %s (%08x) " , tokenIndex , opcounter , GLMDecode ( eD3D_SIO , nInstruction ) , dwToken ) ;
# endif
opcounter + + ;
}
switch ( nInstruction )
{
// -- No arguments at all -----------------------------------------------
case D3DSIO_NOP :
// D3D compiler outputs NOPs when shader debugging/optimizations are disabled.
break ;
case D3DSIO_PHASE :
case D3DSIO_RET :
case D3DSIO_ENDLOOP :
case D3DSIO_BREAK :
TranslationError ( ) ;
PrintOpcode ( nInstruction , buff , sizeof ( buff ) ) ;
StrcatToALUCode ( buff ) ;
StrcatToALUCode ( " ; \n " ) ;
break ;
// -- "Declarative" non dcl ops ----------------------------------------
case D3DSIO_TEXDEPTH :
case D3DSIO_TEXKILL :
Handle_DeclarativeNonDclOp ( nInstruction ) ;
break ;
// -- Unary ops -------------------------------------------------
case D3DSIO_BEM :
case D3DSIO_TEXBEM :
case D3DSIO_TEXBEML :
case D3DSIO_TEXDP3 :
case D3DSIO_TEXDP3TEX :
case D3DSIO_TEXM3x2DEPTH :
case D3DSIO_TEXM3x2TEX :
case D3DSIO_TEXM3x3 :
case D3DSIO_TEXM3x3PAD :
case D3DSIO_TEXM3x3TEX :
case D3DSIO_TEXM3x3VSPEC :
case D3DSIO_TEXREG2AR :
case D3DSIO_TEXREG2GB :
case D3DSIO_TEXREG2RGB :
case D3DSIO_LABEL :
case D3DSIO_CALL :
case D3DSIO_LOOP :
case D3DSIO_BREAKP :
case D3DSIO_DSX :
case D3DSIO_DSY :
TranslationError ( ) ;
break ;
case D3DSIO_IFC :
{
static const char * s_szCompareStrings [ 7 ] =
{
" __INVALID__ " ,
" > " ,
" == " ,
" >= " ,
" < " ,
" != " ,
" <= "
} ;
// Compare mode is encoded in instruction token
uint32 dwCompareMode = OpcodeSpecificData ( dwToken ) ;
Assert ( ( dwCompareMode > = 1 ) & & ( dwCompareMode < = 6 ) ) ;
// Get left side of compare
dwToken = GetNextToken ( ) ;
char szLeftSide [ 32 ] ;
PrintParameterToString ( dwToken , SRC_REGISTER , szLeftSide , sizeof ( szLeftSide ) , false , NULL ) ;
// Get right side of compare
dwToken = GetNextToken ( ) ;
char szRightSide [ 32 ] ;
PrintParameterToString ( dwToken , SRC_REGISTER , szRightSide , sizeof ( szRightSide ) , false , NULL ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " if ( %s %s %s ) \n " , szLeftSide , s_szCompareStrings [ dwCompareMode ] , szRightSide ) ;
StrcatToALUCode ( " { \n " ) ;
m_NumIndentTabs + + ;
break ;
}
case D3DSIO_IF :
dwToken = GetNextToken ( ) ;
PrintParameterToString ( dwToken , SRC_REGISTER , buff , sizeof ( buff ) , false , NULL ) ;
PrintToBufWithIndents ( * m_pBufALUCode , " if ( %s ) \n " , buff ) ;
StrcatToALUCode ( " { \n " ) ;
m_NumIndentTabs + + ;
break ;
case D3DSIO_ELSE :
m_NumIndentTabs - - ;
StrcatToALUCode ( " } \n " ) ;
StrcatToALUCode ( " else \n " ) ;
StrcatToALUCode ( " { \n " ) ;
m_NumIndentTabs + + ;
break ;
case D3DSIO_ENDIF :
m_NumIndentTabs - - ;
StrcatToALUCode ( " } \n " ) ;
break ;
case D3DSIO_REP :
dwToken = GetNextToken ( ) ;
PrintParameterToString ( dwToken , SRC_REGISTER , buff , sizeof ( buff ) , false , NULL ) ;
// In practice, this is the only form of for loop that will appear in DX asm
PrintToBufWithIndents ( * m_pBufALUCode , " for( int i=0; i < %s; i++ ) \n " , buff ) ;
StrcatToALUCode ( " { \n " ) ;
m_nLoopDepth + + ;
// For now, we don't deal with loop nesting
// Easy enough to fix later with an array of loop names i, j, k etc
Assert ( m_nLoopDepth < = 1 ) ;
m_NumIndentTabs + + ;
break ;
case D3DSIO_ENDREP :
m_nLoopDepth - - ;
m_NumIndentTabs - - ;
StrcatToALUCode ( " } \n " ) ;
break ;
case D3DSIO_NRM :
Handle_NRM ( ) ;
break ;
case D3DSIO_MOVA :
Handle_UnaryOp ( nInstruction ) ;
break ;
// Unary operations
case D3DSIO_MOV :
case D3DSIO_RCP :
case D3DSIO_RSQ :
case D3DSIO_EXP :
case D3DSIO_EXPP :
case D3DSIO_LOG :
case D3DSIO_LOGP :
case D3DSIO_FRC :
case D3DSIO_LIT :
case D3DSIO_ABS :
Handle_UnaryOp ( nInstruction ) ;
break ;
// -- Binary ops -------------------------------------------------
case D3DSIO_TEXM3x3SPEC :
case D3DSIO_M4x4 :
case D3DSIO_M4x3 :
case D3DSIO_M3x4 :
case D3DSIO_M3x3 :
case D3DSIO_M3x2 :
case D3DSIO_CALLNZ :
case D3DSIO_SETP :
TranslationError ( ) ;
break ;
case D3DSIO_BREAKC :
Handle_BREAKC ( dwToken ) ;
break ;
// Binary Operations
case D3DSIO_ADD :
case D3DSIO_SUB :
case D3DSIO_MUL :
case D3DSIO_DP3 :
case D3DSIO_DP4 :
case D3DSIO_MIN :
case D3DSIO_MAX :
case D3DSIO_DST :
case D3DSIO_SLT :
case D3DSIO_SGE :
case D3DSIO_CRS :
case D3DSIO_POW :
HandleBinaryOp_GLSL ( nInstruction ) ;
break ;
// -- Ternary ops -------------------------------------------------
case D3DSIO_DP2ADD :
Handle_DP2ADD ( ) ;
break ;
case D3DSIO_LRP :
Handle_LRP ( nInstruction ) ;
break ;
case D3DSIO_SGN :
Assert ( m_bVertexShader ) ;
TranslationError ( ) ; // TODO emulate with SLT etc
break ;
case D3DSIO_CND :
TranslationError ( ) ;
break ;
case D3DSIO_CMP :
Handle_CMP ( ) ;
break ;
case D3DSIO_SINCOS :
Handle_SINCOS ( ) ;
break ;
case D3DSIO_MAD :
Handle_MAD ( nInstruction ) ;
break ;
// -- Quaternary op ------------------------------------------------
case D3DSIO_TEXLDD :
Handle_TexLDD ( nInstruction ) ;
break ;
// -- Special cases: texcoord vs texcrd and tex vs texld -----------
case D3DSIO_TEXCOORD :
Handle_TexCoord ( ) ;
break ;
case D3DSIO_TEX :
Handle_TEX ( dwToken , false ) ;
break ;
case D3DSIO_TEXLDL :
Handle_TEX ( nInstruction , true ) ;
break ;
case D3DSIO_DCL :
Handle_DCL ( ) ;
break ;
case D3DSIO_DEFB :
case D3DSIO_DEFI :
Handle_DEFIB ( nInstruction ) ;
break ;
case D3DSIO_DEF :
Handle_DEF ( ) ;
break ;
case D3DSIO_COMMENT :
// Using OpcodeSpecificData() can fail here since the comments can be longer than 0xff dwords
nNumTokensToSkip = ( dwToken & 0x0fff0000 ) > > 16 ;
SkipTokens ( nNumTokensToSkip ) ;
break ;
case D3DSIO_END :
break ;
}
if ( m_bSpew )
{
int aluCodeLength1 = V_strlen ( ( char * ) m_pBufALUCode - > Base ( ) ) ;
if ( aluCodeLength1 ! = aluCodeLength0 )
{
// code was emitted
printf ( " \n > %s " , ( ( char * ) m_pBufALUCode - > Base ( ) ) + aluCodeLength0 ) ;
aluCodeLength0 = aluCodeLength1 ;
}
}
}
// Note that this constant packing expects .wzyx swizzles in case we ever use the SINCOS code in a ps_2_x shader
//
// The Microsoft do cumentation on this is all kinds of broken and, strangely, these numbers don't even
// match the D3DSINCOSCONST1 and D3DSINCOSCONST2 constants used by the D3D assembly sincos instruction...
if ( m_bNeedsSinCosDeclarations )
{
PrintIndentation ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) ) ;
StrcatToParamCode ( " vec4 scA = vec4( -1.55009923e-6, -2.17013894e-5, 0.00260416674, 0.00026041668 ); \n " ) ;
PrintIndentation ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) ) ;
StrcatToParamCode ( " vec4 scB = vec4( -0.020833334, -0.125, 1.0, 0.5 ); \n " ) ;
}
// Stick in the sampler mask in hex
PrintToBuf ( * m_pBufHeaderCode , " %sSAMPLERMASK-%x \n " , " // " , m_dwSamplerUsageMask ) ;
uint nSamplerTypes = 0 ;
for ( int i = 0 ; i < 16 ; i + + )
{
Assert ( m_dwSamplerTypes [ i ] < 4 ) ;
nSamplerTypes | = ( m_dwSamplerTypes [ i ] < < ( i * 2 ) ) ;
}
PrintToBuf ( * m_pBufHeaderCode , " %sSAMPLERTYPES-%x \n " , " // " , nSamplerTypes ) ;
// fragData outputs referenced
uint nFragDataMask = 0 ;
for ( int i = 0 ; i < 4 ; i + + )
{
nFragDataMask | = m_bOutputColorRegister [ i ] ? ( 1 < < i ) : 0 ;
}
PrintToBuf ( * m_pBufHeaderCode , " %sFRAGDATAMASK-%x \n " , " // " , nFragDataMask ) ;
// Uniforms
PrintToBuf ( * m_pBufHeaderCode , " //HIGHWATER-%d \n " , m_nHighestRegister + 1 ) ;
if ( ( m_bVertexShader ) & & ( m_bGenerateBoneUniformBuffer ) )
{
PrintToBuf ( * m_pBufHeaderCode , " //HIGHWATERBONE-%i \n " , m_nHighestBoneRegister + 1 ) ;
}
PrintToBuf ( * m_pBufHeaderCode , " \n uniform vec4 %s[%d]; \n " , m_bVertexShader ? " vc " : " pc " , m_nHighestRegister + 1 ) ;
if ( ( m_nHighestBoneRegister > = 0 ) & & ( m_bVertexShader ) & & ( m_bGenerateBoneUniformBuffer ) )
{
PrintToBuf ( * m_pBufHeaderCode , " \n uniform vec4 %s[%d]; \n " , " vcbones " , m_nHighestBoneRegister + 1 ) ;
}
if ( m_bVertexShader )
{
PrintToBuf ( * m_pBufHeaderCode , " \n uniform vec4 vcscreen; \n " ) ;
}
for ( int i = 0 ; i < 32 ; i + + )
{
if ( ( m_dwConstIntUsageMask & ( 0x00000001 < < i ) ) & &
( ! ( m_dwDefConstIntUsageMask & ( 0x00000001 < < i ) ) )
)
{
PrintToBuf ( * m_pBufHeaderCode , " uniform int i%d ; \n " , i ) ;
}
}
for ( int i = 0 ; i < 32 ; i + + )
{
if ( m_dwDefConstIntUsageMask & ( 0x00000001 < < i ) )
{
PrintToBuf ( * m_pBufHeaderCode , " const int i%d = %i; \n " , i , m_dwDefConstIntIterCount [ i ] ) ;
}
}
for ( int i = 0 ; i < 32 ; i + + )
{
if ( m_dwConstBoolUsageMask & ( 0x00000001 < < i ) )
{
PrintToBuf ( * m_pBufHeaderCode , m_bVertexShader ? " uniform bool b%d; \n " : " uniform bool fb%d; \n " , i ) ;
}
}
// Control bit for sRGB Write suffix
if ( m_bGenerateSRGBWriteSuffix )
{
// R500 Hookup
// Set this guy to 1 when the sRGBWrite state is true, otherwise 0
StrcatToHeaderCode ( " uniform float flSRGBWrite; \n " ) ;
}
PrintToBuf ( * m_pBufHeaderCode , " \n " ) ;
// Write samplers
WriteGLSLSamplerDefinitions ( ) ;
if ( m_bUsesDSTInstruction )
{
PrintToBuf ( * m_pBufHeaderCode , " vec4 dst(vec4 src0,vec4 src1) { return vec4(1.0f,src0.y*src1.y,src0.z,src1.w); } \n " ) ;
}
if ( m_bDeclareAddressReg )
{
if ( ! m_bGenerateBoneUniformBuffer )
{
m_nHighestRegister = DXABSTRACT_VS_PARAM_SLOTS - 1 ;
}
PrintIndentation ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) ) ;
StrcatToParamCode ( " vec4 va_r; \n " ) ;
}
char * pTempVarStr = " TEMP " ;
pTempVarStr = " vec4 " ;
// Declare temps in Param code buffer
for ( int i = 0 ; i < 32 ; i + + )
{
if ( m_dwTempUsageMask & ( 0x00000001 < < i ) )
{
PrintIndentation ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) ) ;
PrintToBuf ( * m_pBufParamCode , " %s r%d; \n " , pTempVarStr , i ) ;
}
}
if ( m_bVertexShader & & ( m_bDoUserClipPlanes | | m_bDoFixupZ | | m_bDoFixupY ) )
{
PrintIndentation ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) ) ;
StrcatToParamCode ( " vec4 vTempPos; \n " ) ;
}
if ( ( m_bVertexShader ) & & ( m_dwMajorVersion = = 3 ) )
{
for ( int i = 0 ; i < 32 ; i + + )
{
if ( m_dwTexCoordOutMask & ( 1 < < i ) )
{
PrintIndentation ( ( char * ) m_pBufParamCode - > Base ( ) , m_pBufParamCode - > Size ( ) ) ;
char buf [ 256 ] ;
V_snprintf ( buf , sizeof ( buf ) , " vec4 oTempT%i = vec4( 0, 0, 0, 0 ); \n " , i ) ;
StrcatToParamCode ( buf ) ;
}
}
}
if ( m_bNeedsSinCosDeclarations )
{
StrcatToParamCode ( " vec3 vSinCosTmp; \n " ) ; // declare temp used by GLSL sin and cos intrinsics
}
// Optional temps needed to emulate d2add instruction in DX pixel shaders
if ( m_bNeedsD2AddTemp )
{
PrintToBuf ( * m_pBufParamCode , " %s DP2A0; \n %s DP2A1; \n " , pTempVarStr , pTempVarStr ) ;
}
// Optional temp needed to emulate lerp instruction in DX vertex shaders
if ( m_bNeedsLerpTemp )
{
PrintToBuf ( * m_pBufParamCode , " %s LRP_TEMP; \n " , pTempVarStr ) ;
}
// Optional temp needed to emulate NRM instruction in DX shaders
if ( m_bNeedsNRMTemp )
{
PrintToBuf ( * m_pBufParamCode , " %s NRM_TEMP; \n " , pTempVarStr ) ;
}
if ( m_bDeclareVSOPos & & m_bVertexShader )
{
if ( m_bDoUserClipPlanes )
{
// StrcatToALUCode( "gl_ClipVertex = vTempPos;\n" ); // if user clip is enabled, jam clip space position into gl_ClipVertex
}
if ( m_bDoFixupZ | | m_bDoFixupY )
{
// TODO: insert clip distance computation something like this:
//
// StrcatToALUCode( "DP4 oCLP[0].x, oPos, vc[215]; \n" );
//
if ( m_bDoFixupZ )
{
StrcatToALUCode ( " vTempPos.z = vTempPos.z * vc[0].z - vTempPos.w; // z' = (2*z)-w \n " ) ;
}
if ( m_bDoFixupY )
{
// append instructions to flip Y over
// new Y = -(old Y)
StrcatToALUCode ( " vTempPos.y = -vTempPos.y; // y' = -y \n " ) ;
}
// Apply half pixel offset (0.5f pixel offset D3D) to output vertices to account for the pixel center difference between D3D9 and OpenGL.
// This is the actual work in the shader. This works out to be 0.5 pixels wide because clip space is 2 units wide (-1, 1).
StrcatToALUCode ( " vTempPos.xy += vcscreen.xy * vTempPos.w; \n " ) ;
StrcatToALUCode ( " gl_Position = vTempPos; \n " ) ;
}
else
{
StrcatToParamCode ( " OUTPUT oPos = result.position; \n " ) ;
// TODO: insert clip distance computation something like this:
//
// StrcatToALUCode( "DP4 oCLP[0].x, oPos, c[215]; \n" );
//
}
}
if ( m_bVertexShader )
{
if ( m_dwMajorVersion = = 3 )
{
WriteGLSLOutputVariableAssignments ( ) ;
}
else
{
for ( int i = 0 ; i < 32 ; i + + )
{
char outTexCoordBuff [ 64 ] ;
// Don't declare a varying for the output that is mapped to the position output
if ( i ! = m_nVSPositionOutput )
{
if ( m_dwTexCoordOutMask & ( 0x00000001 < < i ) )
{
if ( m_nCentroidMask & ( 0x00000001 < < i ) )
{
V_snprintf ( outTexCoordBuff , sizeof ( outTexCoordBuff ) , " centroid out vec4 oT%d; \n " , i ) ; // centroid varying
StrcatToHeaderCode ( outTexCoordBuff ) ;
}
else
{
V_snprintf ( outTexCoordBuff , sizeof ( outTexCoordBuff ) , " out vec4 oT%d; \n " , i ) ;
StrcatToHeaderCode ( outTexCoordBuff ) ;
}
}
}
}
}
}
else
{
if ( m_dwMajorVersion = = 3 )
{
WriteGLSLInputVariableAssignments ( ) ;
}
}
// do some annotation at the end of the attrib block
{
char temp [ 5000 ] ;
if ( m_bVertexShader )
{
// write attrib map into the text starting at pAttribMapStart - two hex digits per attrib
for ( int i = 0 ; i < 16 ; i + + )
{
if ( m_dwAttribMap [ i ] ! = 0xFFFFFFFF )
{
V_snprintf ( temp , sizeof ( temp ) , " %02X " , m_dwAttribMap [ i ] ) ;
memcpy ( pAttribMapStart + ( i * 3 ) , temp , 2 ) ;
}
}
}
PrintIndentation ( ( char * ) m_pBufAttribCode - > Base ( ) , m_pBufAttribCode - > Size ( ) ) ;
// This used to write out a translation counter into the shader as a comment. However, the order that shaders get in here
// is non-deterministic between runs, and the change in this comment would cause shaders to appear different to the GL disk cache,
// significantly increasing app load time.
// Other code looks for trans#%d, so we can't just remove it. Instead, output it as 0.
V_snprintf ( temp , sizeof ( temp ) , " %s trans#%d label:%s \n " , " // " , 0 , debugLabel ? debugLabel : " none " ) ;
StrcatToAttribCode ( temp ) ;
}
// If we actually sample from a shadow depth sampler, we need to declare the shadow option at the top
if ( m_bDeclareShadowOption )
{
StrcatToHeaderCode ( " OPTION ARB_fragment_program_shadow; \n " ) ;
}
if ( m_iFragDataCount | | m_bGenerateSRGBWriteSuffix )
{
char buf [ 256 ] ;
snprintf ( buf , sizeof buf , " out vec4 _gl_FragData[%d]; \n #define gl_FragData _gl_FragData \n " , m_iFragDataCount ) ;
StrcatToHeaderCode ( buf ) ;
}
# define FindSubcode(a) (V_strstr((char*)m_pBufALUCode->Base(), a) != 0 || V_strstr((char*)m_pBufHeaderCode->Base(), a) != 0 || V_strstr((char*)m_pBufParamCode->Base(), a) != 0 || V_strstr((char*)m_pBufAttribCode->Base(), a) != 0 )
if ( FindSubcode ( " shadow2DProj " ) )
{
StrcatToHeaderCode ( g_szShadow2D ) ;
StrcatToHeaderCode ( g_szShadow2DProj ) ;
}
else if ( FindSubcode ( " shadow2D " ) )
StrcatToHeaderCode ( g_szShadow2D ) ;
if ( FindSubcode ( " _gl_FrontColor " ) & & ! m_bFrontColor )
StrcatToHeaderCode ( " in vec4 _gl_FrontColor; \n " ) ;
if ( FindSubcode ( " _gl_FrontSecondaryColor " ) & & ! m_bFrontSecondaryColor )
StrcatToHeaderCode ( " in vec4 _gl_FrontSecondaryColor; \n " ) ;
if ( m_iFragDataCount & & bVertexShader )
StrcatToHeaderCode ( " \n uniform float alpha_ref; \n " ) ;
StrcatToHeaderCode ( " \n void main() \n { \n " ) ;
if ( m_bUsedAtomicTempVar )
{
PrintToBufWithIndents ( * m_pBufHeaderCode , " vec4 %s; \n \n " , g_pAtomicTempVarName ) ;
}
// sRGB Write suffix
if ( m_bGenerateSRGBWriteSuffix )
{
// StrcatToALUCode( "vec3 sRGBFragData;\n" );
// StrcatToALUCode( "sRGBFragData.xyz = log( gl_FragData[0].xyz );\n" );
// StrcatToALUCode( "sRGBFragData.xyz = sRGBFragData.xyz * vec3( 0.754545f, 0.754545f, 0.754545f );\n" );
// StrcatToALUCode( "sRGBFragData.xyz = exp( sRGBFragData.xyz );\n" );
StrcatToALUCode ( " gl_FragData[0].xyz = pow(gl_FragData[0].xyz, vec3(1.0/2.2)); \n " ) ;
}
if ( m_iFragDataCount & & bVertexShader )
StrcatToALUCode ( " if( gl_FragData[0].a < alpha_ref ) { discard; }; \n " ) ;
strcat_s ( ( char * ) m_pBufALUCode - > Base ( ) , m_pBufALUCode - > Size ( ) , " } \n " ) ;
// Put all of the strings together for final program ( pHeaderCode + pAttribCode + pParamCode + pALUCode )
StrcatToHeaderCode ( ( char * ) m_pBufAttribCode - > Base ( ) ) ;
StrcatToHeaderCode ( ( char * ) m_pBufParamCode - > Base ( ) ) ;
StrcatToHeaderCode ( ( char * ) m_pBufALUCode - > Base ( ) ) ;
// Cleanup - don't touch m_pBufHeaderCode, as it is managed by the caller
delete m_pBufAttribCode ;
delete m_pBufParamCode ;
delete m_pBufALUCode ;
m_pBufAttribCode = m_pBufParamCode = m_pBufALUCode = NULL ;
if ( m_bSpew )
{
printf ( " \n ************* translation complete \n \n " ) ;
}
return DISASM_OK ;
}