Fixed GTE GPL & DCPL opcodes by porting over some changes from an old tree [smf]

This commit is contained in:
smf- 2013-04-07 20:38:53 +00:00
parent cec306dbdf
commit 478bfd6391
2 changed files with 303 additions and 191 deletions

View File

@ -1,7 +1,7 @@
/*
* PlayStation Geometry Transformation Engine emulator
*
* Copyright 2003-2011 smf
* Copyright 2003-2013 smf
*
* divider reverse engineering by pSXAuthor.
*
@ -279,17 +279,17 @@ void gte::setcp2cr( UINT32 pc, int reg, UINT32 value )
m_cp2cr[ reg ].d = value;
}
INT64 gte::BOUNDS( INT64 n_value, INT64 n_max, int n_maxflag, INT64 n_min, int n_minflag )
INT64 gte::BOUNDS( INT64 value, INT64 max, int max_flag, INT64 min, int min_flag )
{
if( n_value > n_max )
if( value > max )
{
FLAG |= n_maxflag;
FLAG |= max_flag;
}
else if( n_value < n_min )
else if( value < min )
{
FLAG |= n_minflag;
FLAG |= min_flag;
}
return n_value;
return value;
}
static const UINT16 reciprocals[ 32768 ]=
@ -2365,18 +2365,61 @@ INLINE UINT32 gte_divide( INT16 numerator, UINT16 denominator )
return 0xffffffff;
}
INLINE INT64 gte_shift( INT64 a, int sf )
{
if( sf > 0 )
{
return a >> 12;
}
else if( sf < 0 )
{
return a << 12;
}
return a;
}
/* Setting bits 12 & 19-22 in FLAG does not set bit 31 */
#define A1( a ) BOUNDS( ( a ), 0x7fffffff, ( 1 << 31 ) | ( 1 << 30 ), -(INT64)0x80000000, ( 1 << 31 ) | ( 1 << 27 ) )
#define A2( a ) BOUNDS( ( a ), 0x7fffffff, ( 1 << 31 ) | ( 1 << 29 ), -(INT64)0x80000000, ( 1 << 31 ) | ( 1 << 26 ) )
#define A3( a ) BOUNDS( ( a ), 0x7fffffff, ( 1 << 31 ) | ( 1 << 28 ), -(INT64)0x80000000, ( 1 << 31 ) | ( 1 << 25 ) )
#define Lm_B1( a, l ) LIM( ( a ), 0x7fff, -0x8000 * !l, ( 1 << 31 ) | ( 1 << 24 ) )
#define Lm_B2( a, l ) LIM( ( a ), 0x7fff, -0x8000 * !l, ( 1 << 31 ) | ( 1 << 23 ) )
#define Lm_B3( a, l ) LIM( ( a ), 0x7fff, -0x8000 * !l, ( 1 << 22 ) )
#define Lm_C1( a ) LIM( ( a ), 0x00ff, 0x0000, ( 1 << 21 ) )
#define Lm_C2( a ) LIM( ( a ), 0x00ff, 0x0000, ( 1 << 20 ) )
#define Lm_C3( a ) LIM( ( a ), 0x00ff, 0x0000, ( 1 << 19 ) )
#define Lm_D( a ) LIM( ( a ), 0xffff, 0x0000, ( 1 << 31 ) | ( 1 << 18 ) )
INT64 gte::A1( INT64 a ) { return BOUNDS( ( a ), U64(0x7ffffffffff), ( 1 << 31 ) | ( 1 << 30 ), U64(-0x80000000000), ( 1 << 31 ) | ( 1 << 27 ) ); }
INT64 gte::A2( INT64 a ) { return BOUNDS( ( a ), U64(0x7ffffffffff), ( 1 << 31 ) | ( 1 << 29 ), U64(-0x80000000000), ( 1 << 31 ) | ( 1 << 26 ) ); }
INT64 gte::A3( INT64 a ) { return BOUNDS( ( a ), U64(0x7ffffffffff), ( 1 << 31 ) | ( 1 << 28 ), U64(-0x80000000000), ( 1 << 31 ) | ( 1 << 25 ) ); }
INT32 gte::Lm_B1( INT32 a, int lm ) { return LIM( ( a ), 0x7fff, -0x8000 * !lm, ( 1 << 31 ) | ( 1 << 24 ) ); }
INT32 gte::Lm_B2( INT32 a, int lm ) { return LIM( ( a ), 0x7fff, -0x8000 * !lm, ( 1 << 31 ) | ( 1 << 23 ) ); }
INT32 gte::Lm_B3( INT32 a, int lm ) { return LIM( ( a ), 0x7fff, -0x8000 * !lm, ( 1 << 22 ) ); }
INT32 gte::Lm_B3_sf( INT64 value, int sf, int lm )
{
INT32 value_sf = gte_shift( value, sf );
INT32 value_12 = gte_shift( value, 1 );
int max = 0x7fff;
int min = 0;
if( lm == 0 )
{
min = -0x8000;
}
if( value_12 < -0x8000 || value_12 > 0x7fff )
{
FLAG |= ( 1 << 22 );
}
if( value_sf > max )
{
return max;
}
else if( value_sf < min )
{
return min;
}
return value_sf;
}
INT32 gte::Lm_C1( INT32 a ) { return LIM( ( a ), 0x00ff, 0x0000, ( 1 << 21 ) ); }
INT32 gte::Lm_C2( INT32 a ) { return LIM( ( a ), 0x00ff, 0x0000, ( 1 << 20 ) ); }
INT32 gte::Lm_C3( INT32 a ) { return LIM( ( a ), 0x00ff, 0x0000, ( 1 << 19 ) ); }
INT32 gte::Lm_D( INT32 a ) { return LIM( ( a ), 0xffff, 0x0000, ( 1 << 31 ) | ( 1 << 18 ) ); }
UINT32 gte::Lm_E( UINT32 result )
{
@ -2389,49 +2432,78 @@ UINT32 gte::Lm_E( UINT32 result )
return result;
}
#define F( a ) BOUNDS( ( a ), 0x7fffffff, ( 1 << 31 ) | ( 1 << 16 ), -(INT64)0x80000000, ( 1 << 31 ) | ( 1 << 15 ) )
#define Lm_G1( a ) LIM( ( a ), 0x3ff, -0x400, ( 1 << 31 ) | ( 1 << 14 ) )
#define Lm_G2( a ) LIM( ( a ), 0x3ff, -0x400, ( 1 << 31 ) | ( 1 << 13 ) )
#define Lm_H( a ) LIM( ( a ), 0xfff, 0x000, ( 1 << 12 ) )
INT64 gte::F( INT64 a ) { return BOUNDS( ( a ), U64(0x7fffffff), ( 1 << 31 ) | ( 1 << 16 ), U64(-0x80000000), ( 1 << 31 ) | ( 1 << 15 ) ); }
INT32 gte::Lm_G1( INT32 a ) { return LIM( ( a ), 0x3ff, -0x400, ( 1 << 31 ) | ( 1 << 14 ) ); }
INT32 gte::Lm_G2( INT32 a ) { return LIM( ( a ), 0x3ff, -0x400, ( 1 << 31 ) | ( 1 << 13 ) ); }
INT32 gte::Lm_H( INT64 value, int sf )
{
INT64 value_sf = gte_shift( value, sf );
INT32 value_12 = gte_shift( value, 1 );
int max = 0x1000;
int min = 0x0000;
if( value_sf < min || value_sf > max )
{
FLAG |= ( 1 << 12 );
}
if( value_12 > max )
{
return max;
}
else if( value_12 < min )
{
return min;
}
return value_12;
}
int gte::docop2( UINT32 pc, int gteop )
{
int shift;
int sf;
int v;
int lm;
int cv;
int mx;
INT32 h_over_sz3;
INT64 mac0;
INT64 mac1;
INT64 mac2;
INT64 mac3;
switch( GTE_FUNCT( gteop ) )
{
case 0x01:
if( gteop == 0x0180001 )
{
GTELOG( pc, "%08x RTPS", gteop );
FLAG = 0;
GTELOG( pc, "%08x RTPS", gteop );
FLAG = 0;
MAC1 = A1( ( ( (INT64) TRX << 12 ) + ( R11 * VX0 ) + ( R12 * VY0 ) + ( R13 * VZ0 ) ) >> 12 );
MAC2 = A2( ( ( (INT64) TRY << 12 ) + ( R21 * VX0 ) + ( R22 * VY0 ) + ( R23 * VZ0 ) ) >> 12 );
MAC3 = A3( ( ( (INT64) TRZ << 12 ) + ( R31 * VX0 ) + ( R32 * VY0 ) + ( R33 * VZ0 ) ) >> 12 );
IR1 = Lm_B1( MAC1, 0 );
IR2 = Lm_B2( MAC2, 0 );
IR3 = Lm_B3( MAC3, 0 );
SZ0 = SZ1;
SZ1 = SZ2;
SZ2 = SZ3;
SZ3 = Lm_D( MAC3 );
h_over_sz3 = Lm_E( gte_divide( H, SZ3 ) );
SXY0 = SXY1;
SXY1 = SXY2;
SX2 = Lm_G1( F( (INT64) OFX + ( (INT64) IR1 * h_over_sz3 ) ) >> 16 );
SY2 = Lm_G2( F( (INT64) OFY + ( (INT64) IR2 * h_over_sz3 ) ) >> 16 );
MAC0 = F( (INT64) DQB + ( (INT64) DQA * h_over_sz3 ) );
IR0 = Lm_H( MAC0 >> 12 );
return 1;
}
break;
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
mac1 = A1( ( (INT64) TRX << 12 ) + ( R11 * VX0 ) + ( R12 * VY0 ) + ( R13 * VZ0 ) );
mac2 = A2( ( (INT64) TRY << 12 ) + ( R21 * VX0 ) + ( R22 * VY0 ) + ( R23 * VZ0 ) );
mac3 = A3( ( (INT64) TRZ << 12 ) + ( R31 * VX0 ) + ( R32 * VY0 ) + ( R33 * VZ0 ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3_sf( mac3, sf, lm );
SZ0 = SZ1;
SZ1 = SZ2;
SZ2 = SZ3;
SZ3 = Lm_D( gte_shift( mac3, 1 ) );
h_over_sz3 = Lm_E( gte_divide( H, SZ3 ) );
SXY0 = SXY1;
SXY1 = SXY2;
SX2 = Lm_G1( F( (INT64) OFX + ( (INT64) IR1 * h_over_sz3 ) ) >> 16 );
SY2 = Lm_G2( F( (INT64) OFY + ( (INT64) IR2 * h_over_sz3 ) ) >> 16 );
mac0 = F( (INT64) DQB + ( (INT64) DQA * h_over_sz3 ) );
MAC0 = mac0;
IR0 = Lm_H( mac0, 1 );
return 1;
case 0x06:
GTELOG( pc, "%08x NCLIP", gteop );
@ -2444,12 +2516,15 @@ int gte::docop2( UINT32 pc, int gteop )
GTELOG( pc, "%08x OP", gteop );
FLAG = 0;
shift = 12 * GTE_SF( gteop );
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
MAC1 = A1( ( (INT64) ( R22 * IR3 ) - ( R33 * IR2 ) ) >> shift );
MAC2 = A2( ( (INT64) ( R33 * IR1 ) - ( R11 * IR3 ) ) >> shift );
MAC3 = A3( ( (INT64) ( R11 * IR2 ) - ( R22 * IR1 ) ) >> shift );
mac1 = A1( (INT64) ( R22 * IR3 ) - ( R33 * IR2 ) );
mac2 = A2( (INT64) ( R33 * IR1 ) - ( R11 * IR3 ) );
mac3 = A3( (INT64) ( R11 * IR2 ) - ( R22 * IR1 ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
@ -2459,12 +2534,15 @@ int gte::docop2( UINT32 pc, int gteop )
GTELOG( pc, "%08x DPCS", gteop );
FLAG = 0;
shift = 12 * GTE_SF( gteop );
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
MAC1 = ( ( R << 16 ) + ( IR0 * Lm_B1( A1( (INT64) RFC - ( R << 4 ) ) << ( 12 - shift ), 0 ) ) ) >> shift;
MAC2 = ( ( G << 16 ) + ( IR0 * Lm_B2( A2( (INT64) GFC - ( G << 4 ) ) << ( 12 - shift ), 0 ) ) ) >> shift;
MAC3 = ( ( B << 16 ) + ( IR0 * Lm_B3( A3( (INT64) BFC - ( B << 4 ) ) << ( 12 - shift ), 0 ) ) ) >> shift;
mac1 = ( ( R << 16 ) + ( IR0 * Lm_B1( gte_shift( A1( ( (INT64) RFC << 12 ) - ( R << 16 ) ), sf ), 0 ) ) );
mac2 = ( ( G << 16 ) + ( IR0 * Lm_B2( gte_shift( A2( ( (INT64) GFC << 12 ) - ( G << 16 ) ), sf ), 0 ) ) );
mac3 = ( ( B << 16 ) + ( IR0 * Lm_B3( gte_shift( A3( ( (INT64) BFC << 12 ) - ( B << 16 ) ), sf ), 0 ) ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
@ -2480,12 +2558,15 @@ int gte::docop2( UINT32 pc, int gteop )
GTELOG( pc, "%08x INTPL", gteop );
FLAG = 0;
shift = 12 * GTE_SF( gteop );
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
MAC1 = ( ( IR1 << 12 ) + ( IR0 * Lm_B1( A1( (INT64) RFC - IR1 ) << ( 12 - shift ), 0 ) ) ) >> shift;
MAC2 = ( ( IR2 << 12 ) + ( IR0 * Lm_B2( A2( (INT64) GFC - IR2 ) << ( 12 - shift ), 0 ) ) ) >> shift;
MAC3 = ( ( IR3 << 12 ) + ( IR0 * Lm_B3( A3( (INT64) BFC - IR3 ) << ( 12 - shift ), 0 ) ) ) >> shift;
mac1 = ( ( IR1 << 12 ) + ( IR0 * Lm_B1( gte_shift( A1( ( (INT64) RFC << 12 ) - ( IR1 << 12 ) ), sf ), 0 ) ) );
mac2 = ( ( IR2 << 12 ) + ( IR0 * Lm_B2( gte_shift( A2( ( (INT64) GFC << 12 ) - ( IR2 << 12 ) ), sf ), 0 ) ) );
mac3 = ( ( IR3 << 12 ) + ( IR0 * Lm_B3( gte_shift( A3( ( (INT64) BFC << 12 ) - ( IR3 << 12 ) ), sf ), 0 ) ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
@ -2498,27 +2579,25 @@ int gte::docop2( UINT32 pc, int gteop )
return 1;
case 0x12:
if( GTE_OP( gteop ) == 0x04 )
{
GTELOG( pc, "%08x MVMVA", gteop );
shift = 12 * GTE_SF( gteop );
mx = GTE_MX( gteop );
v = GTE_V( gteop );
cv = GTE_CV( gteop );
lm = GTE_LM( gteop );
GTELOG( pc, "%08x MVMVA", gteop );
FLAG = 0;
FLAG = 0;
mx = GTE_MX( gteop );
v = GTE_V( gteop );
cv = GTE_CV( gteop );
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
MAC1 = A1( ( ( (INT64) CV1( cv ) << 12 ) + ( MX11( mx ) * VX( v ) ) + ( MX12( mx ) * VY( v ) ) + ( MX13( mx ) * VZ( v ) ) ) >> shift );
MAC2 = A2( ( ( (INT64) CV2( cv ) << 12 ) + ( MX21( mx ) * VX( v ) ) + ( MX22( mx ) * VY( v ) ) + ( MX23( mx ) * VZ( v ) ) ) >> shift );
MAC3 = A3( ( ( (INT64) CV3( cv ) << 12 ) + ( MX31( mx ) * VX( v ) ) + ( MX32( mx ) * VY( v ) ) + ( MX33( mx ) * VZ( v ) ) ) >> shift );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
return 1;
}
break;
mac1 = A1( ( (INT64) CV1( cv ) << 12 ) + ( MX11( mx ) * VX( v ) ) + ( MX12( mx ) * VY( v ) ) + ( MX13( mx ) * VZ( v ) ) );
mac2 = A2( ( (INT64) CV2( cv ) << 12 ) + ( MX21( mx ) * VX( v ) ) + ( MX22( mx ) * VY( v ) ) + ( MX23( mx ) * VZ( v ) ) );
mac3 = A3( ( (INT64) CV3( cv ) << 12 ) + ( MX31( mx ) * VX( v ) ) + ( MX32( mx ) * VY( v ) ) + ( MX33( mx ) * VZ( v ) ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
return 1;
case 0x13:
if( gteop == 0x0e80413 )
@ -2710,85 +2789,98 @@ int gte::docop2( UINT32 pc, int gteop )
break;
case 0x20:
if( gteop == 0x0d80420 )
{
GTELOG( pc, "%08x NCT", gteop );
FLAG = 0;
for( v = 0; v < 3; v++ )
{
MAC1 = A1( ( ( (INT64) L11 * VX( v ) ) + ( L12 * VY( v ) ) + ( L13 * VZ( v ) ) ) >> 12 );
MAC2 = A2( ( ( (INT64) L21 * VX( v ) ) + ( L22 * VY( v ) ) + ( L23 * VZ( v ) ) ) >> 12 );
MAC3 = A3( ( ( (INT64) L31 * VX( v ) ) + ( L32 * VY( v ) ) + ( L33 * VZ( v ) ) ) >> 12 );
IR1 = Lm_B1( MAC1, 1 );
IR2 = Lm_B2( MAC2, 1 );
IR3 = Lm_B3( MAC3, 1 );
MAC1 = A1( ( ( (INT64) RBK << 12 ) + ( LR1 * IR1 ) + ( LR2 * IR2 ) + ( LR3 * IR3 ) ) >> 12 );
MAC2 = A2( ( ( (INT64) GBK << 12 ) + ( LG1 * IR1 ) + ( LG2 * IR2 ) + ( LG3 * IR3 ) ) >> 12 );
MAC3 = A3( ( ( (INT64) BBK << 12 ) + ( LB1 * IR1 ) + ( LB2 * IR2 ) + ( LB3 * IR3 ) ) >> 12 );
IR1 = Lm_B1( MAC1, 1 );
IR2 = Lm_B2( MAC2, 1 );
IR3 = Lm_B3( MAC3, 1 );
RGB0 = RGB1;
RGB1 = RGB2;
CD2 = CODE;
R2 = Lm_C1( MAC1 >> 4 );
G2 = Lm_C2( MAC2 >> 4 );
B2 = Lm_C3( MAC3 >> 4 );
}
return 1;
}
break;
case 0x28:
GTELOG( pc, "%08x SQR", gteop );
GTELOG( pc, "%08x NCT", gteop );
FLAG = 0;
shift = 12 * GTE_SF( gteop );
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
MAC1 = A1( ( IR1 * IR1 ) >> shift );
MAC2 = A2( ( IR2 * IR2 ) >> shift );
MAC3 = A3( ( IR3 * IR3 ) >> shift );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
return 1;
case 0x29:
if( gteop == 0x0680029 )
for( v = 0; v < 3; v++ )
{
GTELOG( pc, "%08x DPCL", gteop );
FLAG = 0;
MAC1 = A1( ( ( ( (INT64) R << 4 ) * IR1 ) + ( IR0 * Lm_B1( RFC - ( ( R * IR1 ) >> 8 ), 0 ) ) ) >> 12 );
MAC2 = A2( ( ( ( (INT64) G << 4 ) * IR2 ) + ( IR0 * Lm_B2( GFC - ( ( G * IR2 ) >> 8 ), 0 ) ) ) >> 12 );
MAC3 = A3( ( ( ( (INT64) B << 4 ) * IR3 ) + ( IR0 * Lm_B3( BFC - ( ( B * IR3 ) >> 8 ), 0 ) ) ) >> 12 );
IR1 = Lm_B1( MAC1, 1 );
IR2 = Lm_B2( MAC2, 1 );
IR3 = Lm_B3( MAC3, 1 );
mac1 = A1( (INT64) ( L11 * VX( v ) ) + ( L12 * VY( v ) ) + ( L13 * VZ( v ) ) );
mac2 = A2( (INT64) ( L21 * VX( v ) ) + ( L22 * VY( v ) ) + ( L23 * VZ( v ) ) );
mac3 = A3( (INT64) ( L31 * VX( v ) ) + ( L32 * VY( v ) ) + ( L33 * VZ( v ) ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
mac1 = A1( ( (INT64) RBK << 12 ) + ( LR1 * IR1 ) + ( LR2 * IR2 ) + ( LR3 * IR3 ) );
mac2 = A2( ( (INT64) GBK << 12 ) + ( LG1 * IR1 ) + ( LG2 * IR2 ) + ( LG3 * IR3 ) );
mac3 = A3( ( (INT64) BBK << 12 ) + ( LB1 * IR1 ) + ( LB2 * IR2 ) + ( LB3 * IR3 ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
RGB0 = RGB1;
RGB1 = RGB2;
CD2 = CODE;
R2 = Lm_C1( MAC1 >> 4 );
G2 = Lm_C2( MAC2 >> 4 );
B2 = Lm_C3( MAC3 >> 4 );
return 1;
}
break;
return 1;
case 0x28:
GTELOG( pc, "%08x SQR", gteop );
FLAG = 0;
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
mac1 = A1( IR1 * IR1 );
mac2 = A2( IR2 * IR2 );
mac3 = A3( IR3 * IR3 );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
return 1;
case 0x29:
GTELOG( pc, "%08x DPCL", gteop );
FLAG = 0;
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
mac1 = ( ( ( R << 4 ) * IR1 ) + ( IR0 * Lm_B1( gte_shift( A1( ( (INT64) RFC << 12 ) - ( ( R << 4 ) * IR1 ) ), sf ), 0 ) ) );
mac2 = ( ( ( G << 4 ) * IR2 ) + ( IR0 * Lm_B2( gte_shift( A2( ( (INT64) GFC << 12 ) - ( ( G << 4 ) * IR2 ) ), sf ), 0 ) ) );
mac3 = ( ( ( B << 4 ) * IR3 ) + ( IR0 * Lm_B3( gte_shift( A3( ( (INT64) BFC << 12 ) - ( ( B << 4 ) * IR3 ) ), sf ), 0 ) ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
RGB0 = RGB1;
RGB1 = RGB2;
CD2 = CODE;
R2 = Lm_C1( MAC1 >> 4 );
G2 = Lm_C2( MAC2 >> 4 );
B2 = Lm_C3( MAC3 >> 4 );
return 1;
case 0x2a:
GTELOG( pc, "%08x DPCT", gteop );
FLAG = 0;
shift = 12 * GTE_SF( gteop );
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
for( v = 0; v < 3; v++ )
{
MAC1 = ( ( R0 << 16 ) + ( IR0 * Lm_B1( A1( (INT64) RFC - ( R0 << 4 ) ) << ( 12 - shift ), 0 ) ) ) >> shift;
MAC2 = ( ( G0 << 16 ) + ( IR0 * Lm_B2( A2( (INT64) GFC - ( G0 << 4 ) ) << ( 12 - shift ), 0 ) ) ) >> shift;
MAC3 = ( ( B0 << 16 ) + ( IR0 * Lm_B3( A3( (INT64) BFC - ( B0 << 4 ) ) << ( 12 - shift ), 0 ) ) ) >> shift;
mac1 = ( ( R0 << 16 ) + ( IR0 * Lm_B1( gte_shift( A1( ( (INT64) RFC << 12 ) - ( R0 << 16 ) ), sf ), 0 ) ) );
mac2 = ( ( G0 << 16 ) + ( IR0 * Lm_B2( gte_shift( A2( ( (INT64) GFC << 12 ) - ( G0 << 16 ) ), sf ), 0 ) ) );
mac3 = ( ( B0 << 16 ) + ( IR0 * Lm_B3( gte_shift( A3( ( (INT64) BFC << 12 ) - ( B0 << 16 ) ), sf ), 0 ) ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
@ -2805,62 +2897,66 @@ int gte::docop2( UINT32 pc, int gteop )
GTELOG( pc, "%08x AVSZ3", gteop );
FLAG = 0;
mac0 = F( (INT64) ( ZSF3 * SZ1 ) + ( ZSF3 * SZ2 ) + ( ZSF3 * SZ3 ) );
OTZ = Lm_D( mac0 >> 12 );
mac0 = F( (INT64)( ZSF3 * SZ1 ) + ( ZSF3 * SZ2 ) + ( ZSF3 * SZ3 ) );
MAC0 = mac0;
OTZ = Lm_D( mac0 >> 12 );
return 1;
case 0x2e:
GTELOG( pc, "%08x AVSZ4", gteop );
FLAG = 0;
mac0 = F( (INT64) ( ZSF4 * SZ0 ) + ( ZSF4 * SZ1 ) + ( ZSF4 * SZ2 ) + ( ZSF4 * SZ3 ) );
OTZ = Lm_D( mac0 >> 12 );
mac0 = F( (INT64)( ZSF4 * SZ0 ) + ( ZSF4 * SZ1 ) + ( ZSF4 * SZ2 ) + ( ZSF4 * SZ3 ) );
MAC0 = mac0;
OTZ = Lm_D( mac0 >> 12 );
return 1;
case 0x30:
if( gteop == 0x0280030 )
{
GTELOG( pc, "%08x RTPT", gteop );
FLAG = 0;
GTELOG( pc, "%08x RTPT", gteop );
FLAG = 0;
for( v = 0; v < 3; v++ )
{
MAC1 = A1( ( ( (INT64) TRX << 12 ) + ( R11 * VX( v ) ) + ( R12 * VY( v ) ) + ( R13 * VZ( v ) ) ) >> 12 );
MAC2 = A2( ( ( (INT64) TRY << 12 ) + ( R21 * VX( v ) ) + ( R22 * VY( v ) ) + ( R23 * VZ( v ) ) ) >> 12 );
MAC3 = A3( ( ( (INT64) TRZ << 12 ) + ( R31 * VX( v ) ) + ( R32 * VY( v ) ) + ( R33 * VZ( v ) ) ) >> 12 );
IR1 = Lm_B1( MAC1, 0 );
IR2 = Lm_B2( MAC2, 0 );
IR3 = Lm_B3( MAC3, 0 );
SZ0 = SZ1;
SZ1 = SZ2;
SZ2 = SZ3;
SZ3 = Lm_D( MAC3 );
h_over_sz3 = Lm_E( gte_divide( H, SZ3 ) );
SXY0 = SXY1;
SXY1 = SXY2;
SX2 = Lm_G1( F( ( (INT64) OFX + ( (INT64) IR1 * h_over_sz3 ) ) >> 16 ) );
SY2 = Lm_G2( F( ( (INT64) OFY + ( (INT64) IR2 * h_over_sz3 ) ) >> 16 ) );
MAC0 = F( (INT64) DQB + ( (INT64) DQA * h_over_sz3 ) );
IR0 = Lm_H( MAC0 >> 12 );
}
return 1;
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
for( v = 0; v < 3; v++ )
{
mac1 = A1( ( (INT64) TRX << 12 ) + ( R11 * VX( v ) ) + ( R12 * VY( v ) ) + ( R13 * VZ( v ) ) );
mac2 = A2( ( (INT64) TRY << 12 ) + ( R21 * VX( v ) ) + ( R22 * VY( v ) ) + ( R23 * VZ( v ) ) );
mac3 = A3( ( (INT64) TRZ << 12 ) + ( R31 * VX( v ) ) + ( R32 * VY( v ) ) + ( R33 * VZ( v ) ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3_sf( mac3, sf, lm );
SZ0 = SZ1;
SZ1 = SZ2;
SZ2 = SZ3;
SZ3 = Lm_D( gte_shift( mac3, 1 ) );
h_over_sz3 = Lm_E( gte_divide( H, SZ3 ) );
SXY0 = SXY1;
SXY1 = SXY2;
SX2 = Lm_G1( F( (INT64) OFX + ( (INT64) IR1 * h_over_sz3 ) ) >> 16 );
SY2 = Lm_G2( F( (INT64) OFY + ( (INT64) IR2 * h_over_sz3 ) ) >> 16 );
mac0 = F( (INT64) DQB + ( (INT64) DQA * h_over_sz3 ) );
MAC0 = mac0;
IR0 = Lm_H( mac0, 1 );
}
break;
return 1;
case 0x3d:
GTELOG( pc, "%08x GPF", gteop );
FLAG = 0;
shift = 12 * GTE_SF( gteop );
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
MAC1 = A1( IR0 * IR1 ) >> shift;
MAC2 = A2( IR0 * IR2 ) >> shift;
MAC3 = A3( IR0 * IR3 ) >> shift;
mac1 = A1( IR0 * IR1 );
mac2 = A2( IR0 * IR2 );
mac3 = A3( IR0 * IR3 );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
@ -2873,27 +2969,28 @@ int gte::docop2( UINT32 pc, int gteop )
return 1;
case 0x3e:
if( GTE_OP( gteop ) == 0x1a )
{
GTELOG( pc, "%08x GPL", gteop );
shift = 12 * GTE_SF( gteop );
FLAG = 0;
GTELOG( pc, "%08x GPL", gteop );
FLAG = 0;
MAC1 = A1( ( ( (INT64) MAC1 << shift ) + ( IR0 * IR1 ) ) >> shift );
MAC2 = A2( ( ( (INT64) MAC2 << shift ) + ( IR0 * IR2 ) ) >> shift );
MAC3 = A3( ( ( (INT64) MAC3 << shift ) + ( IR0 * IR3 ) ) >> shift );
IR1 = Lm_B1( MAC1, 0 );
IR2 = Lm_B2( MAC2, 0 );
IR3 = Lm_B3( MAC3, 0 );
RGB0 = RGB1;
RGB1 = RGB2;
CD2 = CODE;
R2 = Lm_C1( MAC1 >> 4 );
G2 = Lm_C2( MAC2 >> 4 );
B2 = Lm_C3( MAC3 >> 4 );
return 1;
}
break;
sf = GTE_SF( gteop );
lm = GTE_LM( gteop );
mac1 = A1( gte_shift( MAC1, -sf ) + ( IR0 * IR1 ) );
mac2 = A2( gte_shift( MAC2, -sf ) + ( IR0 * IR2 ) );
mac3 = A3( gte_shift( MAC3, -sf ) + ( IR0 * IR3 ) );
MAC1 = gte_shift( mac1, sf );
MAC2 = gte_shift( mac2, sf );
MAC3 = gte_shift( mac3, sf );
IR1 = Lm_B1( MAC1, lm );
IR2 = Lm_B2( MAC2, lm );
IR3 = Lm_B3( MAC3, lm );
RGB0 = RGB1;
RGB1 = RGB2;
CD2 = CODE;
R2 = Lm_C1( MAC1 >> 4 );
G2 = Lm_C2( MAC2 >> 4 );
B2 = Lm_C3( MAC3 >> 4 );
return 1;
case 0x3f:
if( gteop == 0x108043f ||

View File

@ -39,7 +39,22 @@ public:
protected:
INT32 LIM( INT32 value, INT32 max, INT32 min, UINT32 flag );
INT64 BOUNDS( INT64 n_value, INT64 n_max, int n_maxflag, INT64 n_min, int n_minflag );
INT64 A1( INT64 a );
INT64 A2( INT64 a );
INT64 A3( INT64 a );
INT32 Lm_B1( INT32 a, int lm );
INT32 Lm_B2( INT32 a, int lm );
INT32 Lm_B3( INT32 a, int lm );
INT32 Lm_B3_sf( INT64 value, int sf, int lm );
INT32 Lm_C1( INT32 a );
INT32 Lm_C2( INT32 a );
INT32 Lm_C3( INT32 a );
INT32 Lm_D( INT32 a );
UINT32 Lm_E( UINT32 result );
INT64 F( INT64 a );
INT32 Lm_G1( INT32 a );
INT32 Lm_G2( INT32 a );
INT32 Lm_H( INT64 value, int sf );
};
#endif