/* Copyright 2016-2023 melonDS team This file is part of melonDS. melonDS is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. melonDS is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with melonDS. If not, see http://www.gnu.org/licenses/. */ #ifndef GPU3D_H #define GPU3D_H #include #include #include "Savestate.h" #include "FIFO.h" namespace melonDS { class GPU; struct Vertex { s32 Position[4]; s32 Color[3]; s16 TexCoords[2]; bool Clipped; // final vertex attributes. // allows them to be reused in polygon strips. s32 FinalPosition[2]; s32 FinalColor[3]; // hi-res position (4-bit fractional part) // TODO maybe: hi-res color? (that survives clipping) s32 HiresPosition[2]; }; struct Polygon { Vertex* Vertices[10]; u32 NumVertices; s32 FinalZ[10]; s32 FinalW[10]; bool WBuffer; u32 Attr; u32 TexParam; u32 TexPalette; bool Degenerate; bool FacingView; bool Translucent; bool IsShadowMask; bool IsShadow; int Type; // 0=regular 1=line u32 VTop, VBottom; // vertex indices s32 YTop, YBottom; // Y coords s32 XTop, XBottom; // associated X coords u32 SortKey; }; class Renderer3D; class NDS; class GPU3D { public: GPU3D(melonDS::NDS& nds, std::unique_ptr&& renderer = nullptr) noexcept; ~GPU3D() noexcept = default; void Reset() noexcept; void DoSavestate(Savestate* file) noexcept; void SetEnabled(bool geometry, bool rendering) noexcept; void ExecuteCommand() noexcept; s32 CyclesToRunFor() const noexcept; void Run() noexcept; void CheckFIFOIRQ() noexcept; void CheckFIFODMA() noexcept; void VCount144(GPU& gpu) noexcept; void VBlank() noexcept; void VCount215(GPU& gpu) noexcept; void RestartFrame(GPU& gpu) noexcept; void Stop(const GPU& gpu) noexcept; void SetRenderXPos(u16 xpos) noexcept; [[nodiscard]] u16 GetRenderXPos() const noexcept { return RenderXPos; } u32* GetLine(int line) noexcept; void WriteToGXFIFO(u32 val) noexcept; [[nodiscard]] bool IsRendererAccelerated() const noexcept; [[nodiscard]] Renderer3D& GetCurrentRenderer() noexcept { return *CurrentRenderer; } [[nodiscard]] const Renderer3D& GetCurrentRenderer() const noexcept { return *CurrentRenderer; } void SetCurrentRenderer(std::unique_ptr&& renderer) noexcept { CurrentRenderer = std::move(renderer); } u8 Read8(u32 addr) noexcept; u16 Read16(u32 addr) noexcept; u32 Read32(u32 addr) noexcept; void Write8(u32 addr, u8 val) noexcept; void Write16(u32 addr, u16 val) noexcept; void Write32(u32 addr, u32 val) noexcept; void Blit(const GPU& gpu) noexcept; private: melonDS::NDS& NDS; typedef union { u64 _contents; struct { u32 Param; u8 Command; }; } CmdFIFOEntry; void UpdateClipMatrix() noexcept; void ResetRenderingState() noexcept; void AddCycles(s32 num) noexcept; void NextVertexSlot() noexcept; void StallPolygonPipeline(s32 delay, s32 nonstalldelay) noexcept; void SubmitPolygon() noexcept; void SubmitVertex() noexcept; void CalculateLighting() noexcept; void BoxTest(const u32* params) noexcept; void PosTest() noexcept; void VecTest(u32 param) noexcept; void CmdFIFOWrite(const CmdFIFOEntry& entry) noexcept; CmdFIFOEntry CmdFIFORead() noexcept; void FinishWork(s32 cycles) noexcept; void VertexPipelineSubmitCmd() noexcept { // vertex commands 0x24, 0x25, 0x26, 0x27, 0x28 if (!(VertexSlotsFree & 0x1)) NextVertexSlot(); else AddCycles(1); NormalPipeline = 0; } void VertexPipelineCmdDelayed6() noexcept { // commands 0x20, 0x30, 0x31, 0x72 that can run 6 cycles after a vertex if (VertexPipeline > 2) AddCycles((VertexPipeline - 2) + 1); else AddCycles(NormalPipeline + 1); NormalPipeline = 0; } void VertexPipelineCmdDelayed8() noexcept { // commands 0x29, 0x2A, 0x2B, 0x33, 0x34, 0x41, 0x60, 0x71 that can run 8 cycles after a vertex if (VertexPipeline > 0) AddCycles(VertexPipeline + 1); else AddCycles(NormalPipeline + 1); NormalPipeline = 0; } void VertexPipelineCmdDelayed4() noexcept { // all other commands can run 4 cycles after a vertex // no need to do much here since that is the minimum AddCycles(NormalPipeline + 1); NormalPipeline = 0; } std::unique_ptr CurrentRenderer = nullptr; u16 RenderXPos = 0; public: FIFO CmdFIFO {}; FIFO CmdPIPE {}; FIFO CmdStallQueue {}; u32 ZeroDotWLimit = 0; u32 GXStat = 0; u32 ExecParams[32] {}; u32 ExecParamCount = 0; s32 CycleCount = 0; s32 VertexPipeline = 0; s32 NormalPipeline = 0; s32 PolygonPipeline = 0; s32 VertexSlotCounter = 0; u32 VertexSlotsFree = 0; u32 NumPushPopCommands = 0; u32 NumTestCommands = 0; u32 MatrixMode = 0; s32 ProjMatrix[16] {}; s32 PosMatrix[16] {}; s32 VecMatrix[16] {}; s32 TexMatrix[16] {}; s32 ClipMatrix[16] {}; bool ClipMatrixDirty = false; u32 Viewport[6] {}; s32 ProjMatrixStack[16] {}; s32 PosMatrixStack[32][16] {}; s32 VecMatrixStack[32][16] {}; s32 TexMatrixStack[16] {}; s32 ProjMatrixStackPointer = 0; s32 PosMatrixStackPointer = 0; s32 TexMatrixStackPointer = 0; u32 NumCommands = 0; u32 CurCommand = 0; u32 ParamCount = 0; u32 TotalParams = 0; bool GeometryEnabled = false; bool RenderingEnabled = false; u32 DispCnt = 0; u8 AlphaRefVal = 0; u8 AlphaRef = 0; u16 ToonTable[32] {}; u16 EdgeTable[8] {}; u32 FogColor = 0; u32 FogOffset = 0; u8 FogDensityTable[32] {}; u32 ClearAttr1 = 0; u32 ClearAttr2 = 0; u32 RenderDispCnt = 0; u8 RenderAlphaRef = 0; u16 RenderToonTable[32] {}; u16 RenderEdgeTable[8] {}; u32 RenderFogColor = 0; u32 RenderFogOffset = 0; u32 RenderFogShift = 0; u8 RenderFogDensityTable[34] {}; u32 RenderClearAttr1 = 0; u32 RenderClearAttr2 = 0; bool RenderFrameIdentical = false; bool AbortFrame = false; u64 Timestamp = 0; u32 PolygonMode = 0; s16 CurVertex[3] {}; u8 VertexColor[3] {}; s16 TexCoords[2] {}; s16 RawTexCoords[2] {}; s16 Normal[3] {}; s16 LightDirection[4][3] {}; u8 LightColor[4][3] {}; u8 MatDiffuse[3] {}; u8 MatAmbient[3] {}; u8 MatSpecular[3] {}; u8 MatEmission[3] {}; bool UseShininessTable = false; u8 ShininessTable[128] {}; u32 PolygonAttr = 0; u32 CurPolygonAttr = 0; u32 TexParam = 0; u32 TexPalette = 0; s32 PosTestResult[4] {}; s16 VecTestResult[3] {}; Vertex TempVertexBuffer[4] {}; u32 VertexNum = 0; u32 VertexNumInPoly = 0; u32 NumConsecutivePolygons = 0; Polygon* LastStripPolygon = nullptr; u32 NumOpaquePolygons = 0; Vertex VertexRAM[6144 * 2] {}; Polygon PolygonRAM[2048 * 2] {}; Vertex* CurVertexRAM = nullptr; Polygon* CurPolygonRAM = nullptr; u32 NumVertices = 0; u32 NumPolygons = 0; u32 CurRAMBank = 0; std::array RenderPolygonRAM {}; u32 RenderNumPolygons = 0; u32 FlushRequest = 0; u32 FlushAttributes = 0; u32 ScrolledLine[256]; }; class Renderer3D { public: virtual ~Renderer3D() = default; Renderer3D(const Renderer3D&) = delete; Renderer3D& operator=(const Renderer3D&) = delete; virtual void Reset(GPU& gpu) = 0; // This "Accelerated" flag currently communicates if the framebuffer should // be allocated differently and other little misc handlers. Ideally there // are more detailed "traits" that we can ask of the Renderer3D type const bool Accelerated; virtual void VCount144(GPU& gpu) {}; virtual void Stop(const GPU& gpu) {} virtual void RenderFrame(GPU& gpu) = 0; virtual void RestartFrame(GPU& gpu) {}; virtual u32* GetLine(int line) = 0; virtual void Blit(const GPU& gpu) {}; virtual void PrepareCaptureFrame() {} protected: Renderer3D(bool Accelerated); }; } #endif