aboutsummaryrefslogtreecommitdiff
path: root/src/GPU3D.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/GPU3D.cpp')
-rw-r--r--src/GPU3D.cpp733
1 files changed, 442 insertions, 291 deletions
diff --git a/src/GPU3D.cpp b/src/GPU3D.cpp
index 9881760..72e7179 100644
--- a/src/GPU3D.cpp
+++ b/src/GPU3D.cpp
@@ -49,7 +49,6 @@
//
// formula for clear depth: (GBAtek is wrong there)
// clearZ = (val * 0x200) + 0x1FF;
-// if (clearZ >= 0x010000 && clearZ < 0xFFFFFF) clearZ++;
//
// alpha is 5-bit
//
@@ -58,6 +57,10 @@
// (the idea is that each position matrix has an associated vector matrix)
//
// TODO: check if translate works on the vector matrix? seems pointless
+//
+// viewport Y coordinates are upside-down
+//
+// clear color/depth/bitmap/etc registers (04000350/04000354) are double-buffered
namespace GPU3D
@@ -150,7 +153,8 @@ FIFO<CmdFIFOEntry>* CmdPIPE;
u32 NumCommands, CurCommand, ParamCount, TotalParams;
u32 DispCnt;
-u32 AlphaRef;
+u8 AlphaRefVal;
+u8 AlphaRef;
u16 ToonTable[32];
u16 EdgeTable[8];
@@ -165,6 +169,9 @@ u32 ExecParams[32];
u32 ExecParamCount;
s32 CycleCount;
+u32 NumPushPopCommands;
+u32 NumTestCommands;
+
u32 MatrixMode;
@@ -213,6 +220,9 @@ u32 CurPolygonAttr;
u32 TexParam;
u32 TexPalette;
+s32 PosTestResult[4];
+s16 VecTestResult[3];
+
Vertex TempVertexBuffer[4];
u32 VertexNum;
u32 VertexNumInPoly;
@@ -232,6 +242,7 @@ Polygon* RenderPolygonRAM;
u32 RenderNumPolygons;
u32 ClearAttr1, ClearAttr2;
+u32 RenderClearAttr1, RenderClearAttr2;
u32 FlushRequest;
u32 FlushAttributes;
@@ -266,6 +277,9 @@ void Reset()
ParamCount = 0;
TotalParams = 0;
+ NumPushPopCommands = 0;
+ NumTestCommands = 0;
+
DispCnt = 0;
AlphaRef = 0;
@@ -296,6 +310,9 @@ void Reset()
PosMatrixStackPointer = 0;
TexMatrixStackPointer = 0;
+ memset(PosTestResult, 0, 4*4);
+ memset(VecTestResult, 0, 2*3);
+
VertexNum = 0;
VertexNumInPoly = 0;
@@ -449,44 +466,148 @@ void UpdateClipMatrix()
-template<int comp, s32 plane>
+template<int comp, s32 plane, bool attribs>
void ClipSegment(Vertex* outbuf, Vertex* vout, Vertex* vin)
{
s64 factor_num = vin->Position[3] - (plane*vin->Position[comp]);
s32 factor_den = factor_num - (vout->Position[3] - (plane*vout->Position[comp]));
- Vertex mid;
-#define INTERPOLATE(var) { mid.var = (vin->var + ((vout->var - vin->var) * factor_num) / factor_den); }
+#define INTERPOLATE(var) { outbuf->var = (vin->var + ((vout->var - vin->var) * factor_num) / factor_den); }
if (comp != 0) INTERPOLATE(Position[0]);
if (comp != 1) INTERPOLATE(Position[1]);
if (comp != 2) INTERPOLATE(Position[2]);
INTERPOLATE(Position[3]);
- mid.Position[comp] = plane*mid.Position[3];
+ outbuf->Position[comp] = plane*outbuf->Position[3];
- INTERPOLATE(Color[0]);
- INTERPOLATE(Color[1]);
- INTERPOLATE(Color[2]);
+ if (attribs)
+ {
+ INTERPOLATE(Color[0]);
+ INTERPOLATE(Color[1]);
+ INTERPOLATE(Color[2]);
- INTERPOLATE(TexCoords[0]);
- INTERPOLATE(TexCoords[1]);
+ INTERPOLATE(TexCoords[0]);
+ INTERPOLATE(TexCoords[1]);
+ }
- mid.Clipped = true;
+ outbuf->Clipped = true;
#undef INTERPOLATE
- *outbuf = mid;
+}
+
+template<int comp, bool attribs>
+int ClipAgainstPlane(Vertex* vertices, int nverts, int clipstart)
+{
+ Vertex temp[10];
+ int prev, next;
+ int c = clipstart;
+
+ if (clipstart == 2)
+ {
+ temp[0] = vertices[0];
+ temp[1] = vertices[1];
+ }
+
+ for (int i = clipstart; i < nverts; i++)
+ {
+ prev = i-1; if (prev < 0) prev = nverts-1;
+ next = i+1; if (next >= nverts) next = 0;
+
+ Vertex vtx = vertices[i];
+ if (vtx.Position[comp] > vtx.Position[3])
+ {
+ if ((comp == 2) && (!(CurPolygonAttr & (1<<12)))) return 0;
+
+ Vertex* vprev = &vertices[prev];
+ if (vprev->Position[comp] <= vprev->Position[3])
+ {
+ ClipSegment<comp, 1, attribs>(&temp[c], &vtx, vprev);
+ c++;
+ }
+
+ Vertex* vnext = &vertices[next];
+ if (vnext->Position[comp] <= vnext->Position[3])
+ {
+ ClipSegment<comp, 1, attribs>(&temp[c], &vtx, vnext);
+ c++;
+ }
+ }
+ else
+ temp[c++] = vtx;
+ }
+
+ nverts = c; c = clipstart;
+ for (int i = clipstart; i < nverts; i++)
+ {
+ prev = i-1; if (prev < 0) prev = nverts-1;
+ next = i+1; if (next >= nverts) next = 0;
+
+ Vertex vtx = temp[i];
+ if (vtx.Position[comp] < -vtx.Position[3])
+ {
+ Vertex* vprev = &temp[prev];
+ if (vprev->Position[comp] >= -vprev->Position[3])
+ {
+ ClipSegment<comp, -1, attribs>(&vertices[c], &vtx, vprev);
+ c++;
+ }
+
+ Vertex* vnext = &temp[next];
+ if (vnext->Position[comp] >= -vnext->Position[3])
+ {
+ ClipSegment<comp, -1, attribs>(&vertices[c], &vtx, vnext);
+ c++;
+ }
+ }
+ else
+ vertices[c++] = vtx;
+ }
+
+ // checkme
+ for (int i = 0; i < c; i++)
+ {
+ Vertex* vtx = &vertices[i];
+
+ vtx->Color[0] &= ~0xFFF; vtx->Color[0] += 0xFFF;
+ vtx->Color[1] &= ~0xFFF; vtx->Color[1] += 0xFFF;
+ vtx->Color[2] &= ~0xFFF; vtx->Color[2] += 0xFFF;
+ }
+
+ return c;
+}
+
+template<bool attribs>
+int ClipPolygon(Vertex* vertices, int nverts, int clipstart)
+{
+ // clip.
+ // for each vertex:
+ // if it's outside, check if the previous and next vertices are inside
+ // if so, place a new vertex at the edge of the view volume
+
+ // TODO: check for 1-dot polygons
+ // TODO: the hardware seems to use a different algorithm. it reacts differently to vertices with W=0
+
+ // X clipping
+ nverts = ClipAgainstPlane<0, attribs>(vertices, nverts, clipstart);
+
+ // Y clipping
+ nverts = ClipAgainstPlane<1, attribs>(vertices, nverts, clipstart);
+
+ // Z clipping
+ nverts = ClipAgainstPlane<2, attribs>(vertices, nverts, clipstart);
+
+ return nverts;
}
void SubmitPolygon()
{
- Vertex clippedvertices[2][10];
+ Vertex clippedvertices[10];
Vertex* reusedvertices[2];
int clipstart = 0;
int lastpolyverts = 0;
int nverts = PolygonMode & 0x1 ? 4:3;
int prev, next;
- int c;
// culling
@@ -500,7 +621,7 @@ void SubmitPolygon()
normalX = (((s64)v0->Position[1] * v2->Position[3]) - ((s64)v0->Position[3] * v2->Position[1])) >> 12;
normalY = (((s64)v0->Position[3] * v2->Position[0]) - ((s64)v0->Position[0] * v2->Position[3])) >> 12;
normalZ = (((s64)v0->Position[0] * v2->Position[1]) - ((s64)v0->Position[1] * v2->Position[0])) >> 12;
- dot = ((s64)(v1->Position[0] >> 0) * normalX) + ((s64)(v1->Position[1] >> 0) * normalY) + ((s64)(v1->Position[3] >> 0) * normalZ);
+ dot = ((s64)v1->Position[0] * normalX) + ((s64)v1->Position[1] * normalY) + ((s64)v1->Position[3] * normalZ);
bool facingview = (dot < 0);
@@ -558,225 +679,21 @@ void SubmitPolygon()
reusedvertices[0] = LastStripPolygon->Vertices[id0];
reusedvertices[1] = LastStripPolygon->Vertices[id1];
- clippedvertices[0][0] = *reusedvertices[0];
- clippedvertices[0][1] = *reusedvertices[1];
- clippedvertices[1][0] = *reusedvertices[0];
- clippedvertices[1][1] = *reusedvertices[1];
+ clippedvertices[0] = *reusedvertices[0];
+ clippedvertices[1] = *reusedvertices[1];
clipstart = 2;
}
}
- // clip.
- // for each vertex:
- // if it's outside, check if the previous and next vertices are inside
- // if so, place a new vertex at the edge of the view volume
-
- // X clipping
-
- c = clipstart;
- for (int i = clipstart; i < nverts; i++)
- {
- prev = i-1; if (prev < 0) prev = nverts-1;
- next = i+1; if (next >= nverts) next = 0;
-
- Vertex vtx = TempVertexBuffer[i];
- if (vtx.Position[0] > vtx.Position[3])
- {
- Vertex* vprev = &TempVertexBuffer[prev];
- if (vprev->Position[0] <= vprev->Position[3])
- {
- ClipSegment<0, 1>(&clippedvertices[0][c], &vtx, vprev);
- c++;
- }
-
- Vertex* vnext = &TempVertexBuffer[next];
- if (vnext->Position[0] <= vnext->Position[3])
- {
- ClipSegment<0, 1>(&clippedvertices[0][c], &vtx, vnext);
- c++;
- }
- }
- else
- clippedvertices[0][c++] = vtx;
- }
-
- nverts = c; c = clipstart;
for (int i = clipstart; i < nverts; i++)
- {
- prev = i-1; if (prev < 0) prev = nverts-1;
- next = i+1; if (next >= nverts) next = 0;
+ clippedvertices[i] = TempVertexBuffer[i];
- Vertex vtx = clippedvertices[0][i];
- if (vtx.Position[0] < -vtx.Position[3])
- {
- Vertex* vprev = &clippedvertices[0][prev];
- if (vprev->Position[0] >= -vprev->Position[3])
- {
- ClipSegment<0, -1>(&clippedvertices[1][c], &vtx, vprev);
- c++;
- }
+ // clipping
- Vertex* vnext = &clippedvertices[0][next];
- if (vnext->Position[0] >= -vnext->Position[3])
- {
- ClipSegment<0, -1>(&clippedvertices[1][c], &vtx, vnext);
- c++;
- }
- }
- else
- clippedvertices[1][c++] = vtx;
- }
+ nverts = ClipPolygon<true>(clippedvertices, nverts, clipstart);
- for (int i = 0; i < c; i++)
- {
- Vertex* vtx = &clippedvertices[1][i];
-
- vtx->Color[0] &= ~0xFFF; vtx->Color[0] += 0xFFF;
- vtx->Color[1] &= ~0xFFF; vtx->Color[1] += 0xFFF;
- vtx->Color[2] &= ~0xFFF; vtx->Color[2] += 0xFFF;
- }
-
- // Y clipping
-
- nverts = c; c = clipstart;
- for (int i = clipstart; i < nverts; i++)
- {
- prev = i-1; if (prev < 0) prev = nverts-1;
- next = i+1; if (next >= nverts) next = 0;
-
- Vertex vtx = clippedvertices[1][i];
- if (vtx.Position[1] > vtx.Position[3])
- {
- Vertex* vprev = &clippedvertices[1][prev];
- if (vprev->Position[1] <= vprev->Position[3])
- {
- ClipSegment<1, 1>(&clippedvertices[0][c], &vtx, vprev);
- c++;
- }
-
- Vertex* vnext = &clippedvertices[1][next];
- if (vnext->Position[1] <= vnext->Position[3])
- {
- ClipSegment<1, 1>(&clippedvertices[0][c], &vtx, vnext);
- c++;
- }
- }
- else
- clippedvertices[0][c++] = vtx;
- }
-
- nverts = c; c = clipstart;
- for (int i = clipstart; i < nverts; i++)
- {
- prev = i-1; if (prev < 0) prev = nverts-1;
- next = i+1; if (next >= nverts) next = 0;
-
- Vertex vtx = clippedvertices[0][i];
- if (vtx.Position[1] < -vtx.Position[3])
- {
- Vertex* vprev = &clippedvertices[0][prev];
- if (vprev->Position[1] >= -vprev->Position[3])
- {
- ClipSegment<1, -1>(&clippedvertices[1][c], &vtx, vprev);
- c++;
- }
-
- Vertex* vnext = &clippedvertices[0][next];
- if (vnext->Position[1] >= -vnext->Position[3])
- {
- ClipSegment<1, -1>(&clippedvertices[1][c], &vtx, vnext);
- c++;
- }
- }
- else
- clippedvertices[1][c++] = vtx;
- }
-
- for (int i = 0; i < c; i++)
- {
- Vertex* vtx = &clippedvertices[1][i];
-
- vtx->Color[0] &= ~0xFFF; vtx->Color[0] += 0xFFF;
- vtx->Color[1] &= ~0xFFF; vtx->Color[1] += 0xFFF;
- vtx->Color[2] &= ~0xFFF; vtx->Color[2] += 0xFFF;
- }
-
- // Z clipping
-
- bool farplaneclip = false;
- nverts = c; c = clipstart;
- for (int i = clipstart; i < nverts; i++)
- {
- prev = i-1; if (prev < 0) prev = nverts-1;
- next = i+1; if (next >= nverts) next = 0;
-
- Vertex vtx = clippedvertices[1][i];
- if (vtx.Position[2] > vtx.Position[3])
- {
- farplaneclip = true;
-
- Vertex* vprev = &clippedvertices[1][prev];
- if (vprev->Position[2] <= vprev->Position[3])
- {
- ClipSegment<2, 1>(&clippedvertices[0][c], &vtx, vprev);
- c++;
- }
-
- Vertex* vnext = &clippedvertices[1][next];
- if (vnext->Position[2] <= vnext->Position[3])
- {
- ClipSegment<2, 1>(&clippedvertices[0][c], &vtx, vnext);
- c++;
- }
- }
- else
- clippedvertices[0][c++] = vtx;
- }
-
- if (farplaneclip && (!(CurPolygonAttr & (1<<12))))
- {
- LastStripPolygon = NULL;
- return;
- }
-
- nverts = c; c = clipstart;
- for (int i = clipstart; i < nverts; i++)
- {
- prev = i-1; if (prev < 0) prev = nverts-1;
- next = i+1; if (next >= nverts) next = 0;
-
- Vertex vtx = clippedvertices[0][i];
- if (vtx.Position[2] < -vtx.Position[3])
- {
- Vertex* vprev = &clippedvertices[0][prev];
- if (vprev->Position[2] >= -vprev->Position[3])
- {
- ClipSegment<2, -1>(&clippedvertices[1][c], &vtx, vprev);
- c++;
- }
-
- Vertex* vnext = &clippedvertices[0][next];
- if (vnext->Position[2] >= -vnext->Position[3])
- {
- ClipSegment<2, -1>(&clippedvertices[1][c], &vtx, vnext);
- c++;
- }
- }
- else
- clippedvertices[1][c++] = vtx;
- }
-
- for (int i = 0; i < c; i++)
- {
- Vertex* vtx = &clippedvertices[1][i];
-
- vtx->Color[0] &= ~0xFFF; vtx->Color[0] += 0xFFF;
- vtx->Color[1] &= ~0xFFF; vtx->Color[1] += 0xFFF;
- vtx->Color[2] &= ~0xFFF; vtx->Color[2] += 0xFFF;
- }
-
- if (c == 0)
+ if (nverts == 0)
{
LastStripPolygon = NULL;
return;
@@ -784,10 +701,10 @@ void SubmitPolygon()
// build the actual polygon
- if (NumPolygons >= 2048 || NumVertices+c > 6144)
+ if (NumPolygons >= 2048 || NumVertices+nverts > 6144)
{
LastStripPolygon = NULL;
- // TODO: set DISP3DCNT overflow flag
+ DispCnt |= (1<<13);
return;
}
@@ -802,11 +719,19 @@ void SubmitPolygon()
u32 texfmt = (TexParam >> 26) & 0x7;
u32 polyalpha = (CurPolygonAttr >> 16) & 0x1F;
- poly->Translucent = (texfmt == 1 || texfmt == 6 || (polyalpha > 0 && polyalpha < 31));
+ poly->Translucent = ((texfmt == 1 || texfmt == 6) && !(CurPolygonAttr & 0x10)) || (polyalpha > 0 && polyalpha < 31);
+
+ poly->IsShadowMask = ((CurPolygonAttr & 0x3F000030) == 0x00000030);
+ if ((NumPolygons == 1) || (!CurPolygonRAM[NumPolygons-2].IsShadowMask))
+ poly->ClearStencil = poly->IsShadowMask;
+ else
+ poly->ClearStencil = false;
+
+ poly->IsShadow = ((CurPolygonAttr & 0x30) == 0x30) && !poly->IsShadowMask;
if (LastStripPolygon && clipstart > 0)
{
- if (c == lastpolyverts)
+ if (nverts == lastpolyverts)
{
poly->Vertices[0] = reusedvertices[0];
poly->Vertices[1] = reusedvertices[1];
@@ -826,10 +751,10 @@ void SubmitPolygon()
poly->NumVertices += 2;
}
- for (int i = clipstart; i < c; i++)
+ for (int i = clipstart; i < nverts; i++)
{
Vertex* vtx = &CurVertexRAM[NumVertices];
- *vtx = clippedvertices[1][i];
+ *vtx = clippedvertices[i];
poly->Vertices[i] = vtx;
NumVertices++;
@@ -847,24 +772,29 @@ void SubmitPolygon()
}
else
{
+ // W is normalized, such that all the polygon's W values fit within 16 bits
+ // the viewport transform for X and Y uses the original W values, but
+ // the transform for Z uses the normalized W values
+ // W normalization is applied to separate polygons, even within strips
+
posX = (((s64)(vtx->Position[0] + w) * Viewport[2]) / (((s64)w) << 1)) + Viewport[0];
posY = (((s64)(-vtx->Position[1] + w) * Viewport[3]) / (((s64)w) << 1)) + Viewport[1];
- if (FlushAttributes & 0x2) posZ = w;
- else posZ = (((s64)vtx->Position[2] * 0x800000) / w) + 0x7FFEFF;
+ //if (FlushAttributes & 0x2) posZ = w;
+ //else posZ = (((s64)vtx->Position[2] * 0x800000) / w) + 0x7FFEFF;
}
if (posX < 0) posX = 0;
else if (posX > 256) posX = 256;
if (posY < 0) posY = 0;
else if (posY > 192) posY = 192;
- if (posZ < 0) posZ = 0;
- else if (posZ > 0xFFFFFF) posZ = 0xFFFFFF;
+ //if (posZ < 0) posZ = 0;
+ //else if (posZ > 0xFFFFFF) posZ = 0xFFFFFF;
vtx->FinalPosition[0] = posX;
vtx->FinalPosition[1] = posY;
- vtx->FinalPosition[2] = posZ;
- vtx->FinalPosition[3] = w;
+ //vtx->FinalPosition[2] = posZ;
+ //vtx->FinalPosition[3] = w;
vtx->FinalColor[0] = vtx->Color[0] >> 12;
if (vtx->FinalColor[0]) vtx->FinalColor[0] = ((vtx->FinalColor[0] << 4) + 0xF);
@@ -875,11 +805,15 @@ void SubmitPolygon()
}
// determine bounds of the polygon
+ // also determine the W shift and normalize W
+ // TODO: normalization works both ways
+
u32 vtop = 0, vbot = 0;
s32 ytop = 192, ybot = 0;
s32 xtop = 256, xbot = 0;
+ u32 wshift = 0;
- for (int i = 0; i < c; i++)
+ for (int i = 0; i < nverts; i++)
{
Vertex* vtx = poly->Vertices[i];
@@ -895,11 +829,36 @@ void SubmitPolygon()
ybot = vtx->FinalPosition[1];
vbot = i;
}
+
+ u32 w = (u32)vtx->Position[3];
+ while ((w >> wshift) & 0xFFFF0000)
+ wshift += 4;
}
poly->VTop = vtop; poly->VBottom = vbot;
poly->YTop = ytop; poly->YBottom = ybot;
poly->XTop = xtop; poly->XBottom = xbot;
+ poly->WShift = wshift;
+ poly->WBuffer = (FlushAttributes & 0x2);
+
+ for (int i = 0; i < nverts; i++)
+ {
+ Vertex* vtx = poly->Vertices[i];
+ s32 w = vtx->Position[3] >> wshift;
+
+ s32 z;
+ if (FlushAttributes & 0x2)
+ z = w << wshift;
+ else
+ z = (((s64)vtx->Position[2] * 0x800000) / (w << wshift)) + 0x7FFEFF;
+
+ // checkme
+ if (z < 0) z = 0;
+ else if (z > 0xFFFFFF) z = 0xFFFFFF;
+
+ poly->FinalZ[i] = z;
+ poly->FinalW[i] = w;
+ }
if (PolygonMode >= 2)
LastStripPolygon = poly;
@@ -926,8 +885,8 @@ void SubmitVertex()
if ((TexParam >> 30) == 3)
{
- vertextrans->TexCoords[0] = (vertex[0]*TexMatrix[0] + vertex[1]*TexMatrix[4] + vertex[2]*TexMatrix[8] + vertex[3]*(RawTexCoords[0]<<8)) >> 20;
- vertextrans->TexCoords[1] = (vertex[0]*TexMatrix[1] + vertex[1]*TexMatrix[5] + vertex[2]*TexMatrix[9] + vertex[3]*(RawTexCoords[1]<<8)) >> 20;
+ vertextrans->TexCoords[0] = ((vertex[0]*TexMatrix[0] + vertex[1]*TexMatrix[4] + vertex[2]*TexMatrix[8]) >> 24) + RawTexCoords[0];
+ vertextrans->TexCoords[1] = ((vertex[0]*TexMatrix[1] + vertex[1]*TexMatrix[5] + vertex[2]*TexMatrix[9]) >> 24) + RawTexCoords[1];
}
else
{
@@ -1004,6 +963,10 @@ void SubmitVertex()
s32 CalculateLighting()
{
+ // TODO: this requires matrix mode 2, apparently
+ // hardware seems to read garbage when matrix mode isn't 2
+ // also, non-normal normals seem to be treated as zero? or overflow to negative?
+
if ((TexParam >> 30) == 2)
{
TexCoords[0] = RawTexCoords[0] + (((s64)Normal[0]*TexMatrix[0] + (s64)Normal[1]*TexMatrix[4] + (s64)Normal[2]*TexMatrix[8]) >> 21);
@@ -1070,6 +1033,134 @@ s32 CalculateLighting()
}
+void BoxTest(u32* params)
+{
+ Vertex cube[8];
+ Vertex face[10];
+ int res;
+
+ GXStat &= ~(1<<1);
+
+ s32 x0 = (s32)(s16)(params[0] & 0xFFFF);
+ s32 y0 = ((s32)params[0]) >> 16;
+ s32 z0 = (s32)(s16)(params[1] & 0xFFFF);
+ s32 x1 = ((s32)params[1]) >> 16;
+ s32 y1 = (s32)(s16)(params[2] & 0xFFFF);
+ s32 z1 = ((s32)params[2]) >> 16;
+
+ x1 += x0;
+ y1 += y0;
+ z1 += z0;
+
+ cube[0].Position[0] = x0; cube[0].Position[1] = y0; cube[0].Position[2] = z0;
+ cube[1].Position[0] = x1; cube[1].Position[1] = y0; cube[1].Position[2] = z0;
+ cube[2].Position[0] = x1; cube[2].Position[1] = y1; cube[2].Position[2] = z0;
+ cube[3].Position[0] = x0; cube[3].Position[1] = y1; cube[3].Position[2] = z0;
+ cube[4].Position[0] = x0; cube[4].Position[1] = y1; cube[4].Position[2] = z1;
+ cube[5].Position[0] = x0; cube[5].Position[1] = y0; cube[5].Position[2] = z1;
+ cube[6].Position[0] = x1; cube[6].Position[1] = y0; cube[6].Position[2] = z1;
+ cube[7].Position[0] = x1; cube[7].Position[1] = y1; cube[7].Position[2] = z1;
+
+ UpdateClipMatrix();
+ for (int i = 0; i < 8; i++)
+ {
+ s32 x = cube[i].Position[0];
+ s32 y = cube[i].Position[1];
+ s32 z = cube[i].Position[2];
+
+ cube[i].Position[0] = ((s64)x*ClipMatrix[0] + (s64)y*ClipMatrix[4] + (s64)z*ClipMatrix[8] + 0x1000*ClipMatrix[12]) >> 12;
+ cube[i].Position[1] = ((s64)x*ClipMatrix[1] + (s64)y*ClipMatrix[5] + (s64)z*ClipMatrix[9] + 0x1000*ClipMatrix[13]) >> 12;
+ cube[i].Position[2] = ((s64)x*ClipMatrix[2] + (s64)y*ClipMatrix[6] + (s64)z*ClipMatrix[10] + 0x1000*ClipMatrix[14]) >> 12;
+ cube[i].Position[3] = ((s64)x*ClipMatrix[3] + (s64)y*ClipMatrix[7] + (s64)z*ClipMatrix[11] + 0x1000*ClipMatrix[15]) >> 12;
+ }
+
+ // front face (-Z)
+ face[0] = cube[0]; face[1] = cube[1]; face[2] = cube[2]; face[3] = cube[3];
+ res = ClipPolygon<false>(face, 4, 0);
+ if (res > 0)
+ {
+ GXStat |= (1<<1);
+ return;
+ }
+
+ // back face (+Z)
+ face[0] = cube[4]; face[1] = cube[5]; face[2] = cube[6]; face[3] = cube[7];
+ res = ClipPolygon<false>(face, 4, 0);
+ if (res > 0)
+ {
+ GXStat |= (1<<1);
+ return;
+ }
+
+ // left face (-X)
+ face[0] = cube[0]; face[1] = cube[3]; face[2] = cube[4]; face[3] = cube[5];
+ res = ClipPolygon<false>(face, 4, 0);
+ if (res > 0)
+ {
+ GXStat |= (1<<1);
+ return;
+ }
+
+ // right face (+X)
+ face[0] = cube[1]; face[1] = cube[2]; face[2] = cube[7]; face[3] = cube[6];
+ res = ClipPolygon<false>(face, 4, 0);
+ if (res > 0)
+ {
+ GXStat |= (1<<1);
+ return;
+ }
+
+ // bottom face (-Y)
+ face[0] = cube[0]; face[1] = cube[1]; face[2] = cube[6]; face[3] = cube[5];
+ res = ClipPolygon<false>(face, 4, 0);
+ if (res > 0)
+ {
+ GXStat |= (1<<1);
+ return;
+ }
+
+ // top face (+Y)
+ face[0] = cube[2]; face[1] = cube[3]; face[2] = cube[4]; face[3] = cube[7];
+ res = ClipPolygon<false>(face, 4, 0);
+ if (res > 0)
+ {
+ GXStat |= (1<<1);
+ return;
+ }
+}
+
+void PosTest()
+{
+ s64 vertex[4] = {(s64)CurVertex[0], (s64)CurVertex[1], (s64)CurVertex[2], 0x1000};
+
+ UpdateClipMatrix();
+ PosTestResult[0] = (vertex[0]*ClipMatrix[0] + vertex[1]*ClipMatrix[4] + vertex[2]*ClipMatrix[8] + vertex[3]*ClipMatrix[12]) >> 12;
+ PosTestResult[1] = (vertex[0]*ClipMatrix[1] + vertex[1]*ClipMatrix[5] + vertex[2]*ClipMatrix[9] + vertex[3]*ClipMatrix[13]) >> 12;
+ PosTestResult[2] = (vertex[0]*ClipMatrix[2] + vertex[1]*ClipMatrix[6] + vertex[2]*ClipMatrix[10] + vertex[3]*ClipMatrix[14]) >> 12;
+ PosTestResult[3] = (vertex[0]*ClipMatrix[3] + vertex[1]*ClipMatrix[7] + vertex[2]*ClipMatrix[11] + vertex[3]*ClipMatrix[15]) >> 12;
+}
+
+void VecTest(u32* params)
+{
+ // TODO: apparently requires matrix mode 2
+ // TODO: maybe it overwrites the normal registers, too
+
+ s16 normal[3];
+
+ normal[0] = (s16)((params[0] & 0x000003FF) << 6) >> 6;
+ normal[1] = (s16)((params[0] & 0x000FFC00) >> 4) >> 6;
+ normal[2] = (s16)((params[0] & 0x3FF00000) >> 14) >> 6;
+
+ VecTestResult[0] = (normal[0]*VecMatrix[0] + normal[1]*VecMatrix[4] + normal[2]*VecMatrix[8]) >> 9;
+ VecTestResult[1] = (normal[0]*VecMatrix[1] + normal[1]*VecMatrix[5] + normal[2]*VecMatrix[9]) >> 9;
+ VecTestResult[2] = (normal[0]*VecMatrix[2] + normal[1]*VecMatrix[6] + normal[2]*VecMatrix[10]) >> 9;
+
+ if (VecTestResult[0] & 0x1000) VecTestResult[0] |= 0xF000;
+ if (VecTestResult[1] & 0x1000) VecTestResult[1] |= 0xF000;
+ if (VecTestResult[2] & 0x1000) VecTestResult[2] |= 0xF000;
+}
+
+
void CmdFIFOWrite(CmdFIFOEntry& entry)
{
@@ -1096,6 +1187,17 @@ void CmdFIFOWrite(CmdFIFOEntry& entry)
CmdFIFO->Write(entry);
}
+
+ if (entry.Command == 0x11 || entry.Command == 0x12)
+ {
+ GXStat |= (1<<14); // push/pop matrix
+ NumPushPopCommands++;
+ }
+ else if (entry.Command == 0x70 || entry.Command == 0x71 || entry.Command == 0x72)
+ {
+ GXStat |= (1<<0); // box/pos/vec test
+ NumTestCommands++;
+ }
}
CmdFIFOEntry CmdFIFORead()
@@ -1132,7 +1234,6 @@ void ExecuteCommand()
CycleCount += CmdNumCycles[entry.Command];
ExecParamCount = 0;
- GXStat &= ~(1<<14);
if (CycleCount > 0)
GXStat |= (1<<27);
@@ -1143,6 +1244,7 @@ void ExecuteCommand()
break;
case 0x11: // push matrix
+ NumPushPopCommands--;
if (MatrixMode == 0)
{
if (ProjMatrixStackPointer > 0)
@@ -1154,7 +1256,6 @@ void ExecuteCommand()
memcpy(ProjMatrixStack, ProjMatrix, 16*4);
ProjMatrixStackPointer++;
- GXStat |= (1<<14);
}
else if (MatrixMode == 3)
{
@@ -1167,7 +1268,6 @@ void ExecuteCommand()
memcpy(TexMatrixStack, TexMatrix, 16*4);
TexMatrixStackPointer++;
- GXStat |= (1<<14);
}
else
{
@@ -1181,11 +1281,11 @@ void ExecuteCommand()
memcpy(PosMatrixStack[PosMatrixStackPointer], PosMatrix, 16*4);
memcpy(VecMatrixStack[PosMatrixStackPointer], VecMatrix, 16*4);
PosMatrixStackPointer++;
- GXStat |= (1<<14);
}
break;
case 0x12: // pop matrix
+ NumPushPopCommands--;
if (MatrixMode == 0)
{
if (ProjMatrixStackPointer <= 0)
@@ -1197,7 +1297,6 @@ void ExecuteCommand()
ProjMatrixStackPointer--;
memcpy(ProjMatrix, ProjMatrixStack, 16*4);
- GXStat |= (1<<14);
ClipMatrixDirty = true;
}
else if (MatrixMode == 3)
@@ -1211,7 +1310,6 @@ void ExecuteCommand()
TexMatrixStackPointer--;
memcpy(TexMatrix, TexMatrixStack, 16*4);
- GXStat |= (1<<14);
}
else
{
@@ -1228,7 +1326,6 @@ void ExecuteCommand()
memcpy(PosMatrix, PosMatrixStack[PosMatrixStackPointer], 16*4);
memcpy(VecMatrix, VecMatrixStack[PosMatrixStackPointer], 16*4);
- GXStat |= (1<<14);
ClipMatrixDirty = true;
}
break;
@@ -1587,10 +1684,29 @@ void ExecuteCommand()
break;
case 0x60: // viewport x1,y1,x2,y2
+ // note: viewport Y coordinates are upside-down
Viewport[0] = ExecParams[0] & 0xFF;
- Viewport[1] = (ExecParams[0] >> 8) & 0xFF;
+ Viewport[1] = 191 - (ExecParams[0] >> 24);
Viewport[2] = ((ExecParams[0] >> 16) & 0xFF) - Viewport[0] + 1;
- Viewport[3] = (ExecParams[0] >> 24) - Viewport[1] + 1;
+ Viewport[3] = (191 - ((ExecParams[0] >> 8) & 0xFF)) - Viewport[1] + 1;
+ break;
+
+ case 0x70: // box test
+ NumTestCommands -= 3;
+ BoxTest(ExecParams);
+ break;
+
+ case 0x71: // pos test
+ NumTestCommands -= 2;
+ CurVertex[0] = ExecParams[0] & 0xFFFF;
+ CurVertex[1] = ExecParams[0] >> 16;
+ CurVertex[2] = ExecParams[1] & 0xFFFF;
+ PosTest();
+ break;
+
+ case 0x72: // vec test
+ NumTestCommands--;
+ VecTest(ExecParams);
break;
default:
@@ -1613,13 +1729,21 @@ void Run(s32 cycles)
if (CycleCount <= 0)
{
while (CycleCount <= 0 && !CmdPIPE->IsEmpty())
+ {
+ if (NumPushPopCommands == 0) GXStat &= ~(1<<14);
+ if (NumTestCommands == 0) GXStat &= ~(1<<0);
+
ExecuteCommand();
+ }
}
if (CycleCount <= 0 && CmdPIPE->IsEmpty())
{
CycleCount = 0;
- GXStat &= ~((1<<27)|(1<<14));
+ GXStat &= ~(1<<27);
+
+ if (NumPushPopCommands == 0) GXStat &= ~(1<<14);
+ if (NumTestCommands == 0) GXStat &= ~(1<<0);
}
}
@@ -1652,6 +1776,10 @@ void VBlank()
RenderPolygonRAM = CurPolygonRAM;
RenderNumPolygons = NumPolygons;
+ // TODO: find out which other registers are latched for rendering
+ RenderClearAttr1 = ClearAttr1;
+ RenderClearAttr2 = ClearAttr2;
+
CurRAMBank = CurRAMBank?0:1;
CurVertexRAM = &VertexRAM[CurRAMBank ? 6144 : 0];
CurPolygonRAM = &PolygonRAM[CurRAMBank ? 2048 : 0];
@@ -1683,6 +1811,45 @@ u32* GetLine(int line)
}
+void WriteToGXFIFO(u32 val)
+{
+ if (NumCommands == 0)
+ {
+ NumCommands = 4;
+ CurCommand = val;
+ ParamCount = 0;
+ TotalParams = CmdNumParams[CurCommand & 0xFF];
+
+ if (TotalParams > 0) return;
+ }
+ else
+ ParamCount++;
+
+ for (;;)
+ {
+ if ((CurCommand & 0xFF) || (NumCommands == 4 && CurCommand == 0))
+ {
+ CmdFIFOEntry entry;
+ entry.Command = CurCommand & 0xFF;
+ entry.Param = val;
+ CmdFIFOWrite(entry);
+ }
+
+ if (ParamCount >= TotalParams)
+ {
+ CurCommand >>= 8;
+ NumCommands--;
+ if (NumCommands == 0) break;
+
+ ParamCount = 0;
+ TotalParams = CmdNumParams[CurCommand & 0xFF];
+ }
+ if (ParamCount < TotalParams)
+ break;
+ }
+}
+
+
u8 Read8(u32 addr)
{
printf("unknown GPU3D read8 %08X\n", addr);
@@ -1703,6 +1870,10 @@ u16 Read16(u32 addr)
return NumPolygons;
case 0x04000606:
return NumVertices;
+
+ case 0x04000630: return VecTestResult[0];
+ case 0x04000632: return VecTestResult[1];
+ case 0x04000634: return VecTestResult[2];
}
printf("unknown GPU3D read16 %08X\n", addr);
@@ -1734,6 +1905,11 @@ u32 Read32(u32 addr)
case 0x04000604:
return NumPolygons | (NumVertices << 16);
+ case 0x04000620: return PosTestResult[0];
+ case 0x04000624: return PosTestResult[1];
+ case 0x04000628: return PosTestResult[2];
+ case 0x0400062C: return PosTestResult[3];
+
case 0x04000680: return VecMatrix[0];
case 0x04000684: return VecMatrix[1];
case 0x04000688: return VecMatrix[2];
@@ -1760,7 +1936,8 @@ void Write8(u32 addr, u8 val)
switch (addr)
{
case 0x04000340:
- AlphaRef = val & 0x1F;
+ AlphaRefVal = val & 0x1F;
+ AlphaRef = (DispCnt & (1<<2)) ? AlphaRefVal : 0;
return;
}
@@ -1778,11 +1955,15 @@ void Write16(u32 addr, u16 val)
switch (addr)
{
case 0x04000060:
- DispCnt = val;
+ DispCnt = (val & 0x4FFF) | (DispCnt & 0x3000);
+ if (val & (1<<12)) DispCnt &= ~(1<<12);
+ if (val & (1<<13)) DispCnt &= ~(1<<13);
+ AlphaRef = (DispCnt & (1<<2)) ? AlphaRefVal : 0;
return;
case 0x04000340:
- AlphaRef = val & 0x1F;
+ AlphaRefVal = val & 0x1F;
+ AlphaRef = (DispCnt & (1<<2)) ? AlphaRefVal : 0;
return;
case 0x04000350:
@@ -1837,11 +2018,15 @@ void Write32(u32 addr, u32 val)
switch (addr)
{
case 0x04000060:
- DispCnt = val & 0xFFFF;
+ DispCnt = (val & 0x4FFF) | (DispCnt & 0x3000);
+ if (val & (1<<12)) DispCnt &= ~(1<<12);
+ if (val & (1<<13)) DispCnt &= ~(1<<13);
+ AlphaRef = (DispCnt & (1<<2)) ? AlphaRefVal : 0;
return;
case 0x04000340:
- AlphaRef = val & 0x1F;
+ AlphaRefVal = val & 0x1F;
+ AlphaRef = (DispCnt & (1<<2)) ? AlphaRefVal : 0;
return;
case 0x04000350:
@@ -1875,41 +2060,7 @@ void Write32(u32 addr, u32 val)
if (addr >= 0x04000400 && addr < 0x04000440)
{
- if (NumCommands == 0)
- {
- NumCommands = 4;
- CurCommand = val;
- ParamCount = 0;
- TotalParams = CmdNumParams[CurCommand & 0xFF];
-
- if (TotalParams > 0) return;
- }
- else
- ParamCount++;
-
- for (;;)
- {
- if ((CurCommand & 0xFF) || (NumCommands == 4 && CurCommand == 0))
- {
- CmdFIFOEntry entry;
- entry.Command = CurCommand & 0xFF;
- entry.Param = val;
- CmdFIFOWrite(entry);
- }
-
- if (ParamCount >= TotalParams)
- {
- CurCommand >>= 8;
- NumCommands--;
- if (NumCommands == 0) break;
-
- ParamCount = 0;
- TotalParams = CmdNumParams[CurCommand & 0xFF];
- }
- if (ParamCount < TotalParams)
- break;
- }
-
+ WriteToGXFIFO(val);
return;
}