// Copyright 2008 Dolphin Emulator Project // Licensed under GPLv2+ // Refer to the license.txt file included. // DL facts: // Ikaruga uses (nearly) NO display lists! // Zelda WW uses TONS of display lists // Zelda TP uses almost 100% display lists except menus (we like this!) // Super Mario Galaxy has nearly all geometry and more than half of the state in DLs (great!) // Note that it IS NOT GENERALLY POSSIBLE to precompile display lists! You can compile them as they // are // while interpreting them, and hope that the vertex format doesn't change, though, if you do it // right // when they are called. The reason is that the vertex format affects the sizes of the vertices. #include "VideoCommon/OpcodeDecoding.h" #include "Common/CommonTypes.h" #include "Common/Logging/Log.h" #include "Common/MsgHandler.h" #include "Core/FifoPlayer/FifoRecorder.h" #include "Core/HW/Memmap.h" #include "VideoCommon/BPMemory.h" #include "VideoCommon/CPMemory.h" #include "VideoCommon/CommandProcessor.h" #include "VideoCommon/DataReader.h" #include "VideoCommon/Fifo.h" #include "VideoCommon/Statistics.h" #include "VideoCommon/VertexLoaderManager.h" #include "VideoCommon/VideoCommon.h" #include "VideoCommon/XFMemory.h" bool g_bRecordFifoData = false; namespace OpcodeDecoder { static bool s_is_fifo_error_seen = false; static u32 InterpretDisplayList(u32 address, u32 size) { u8* start_address; if (Fifo::UseDeterministicGPUThread()) start_address = static_cast(Fifo::PopFifoAuxBuffer(size)); else start_address = Memory::GetPointer(address); u32 cycles = 0; // Avoid the crash if Memory::GetPointer failed .. if (start_address != nullptr) { // temporarily swap dl and non-dl (small "hack" for the stats) g_stats.SwapDL(); Run(DataReader(start_address, start_address + size), &cycles, true); INCSTAT(g_stats.this_frame.num_dlists_called); // un-swap g_stats.SwapDL(); } return cycles; } static void InterpretDisplayListPreprocess(u32 address, u32 size) { u8* const start_address = Memory::GetPointer(address); Fifo::PushFifoAuxBuffer(start_address, size); if (start_address == nullptr) return; Run(DataReader(start_address, start_address + size), nullptr, true); } void Init() { s_is_fifo_error_seen = false; } template u8* Run(DataReader src, u32* cycles, bool in_display_list) { u32 total_cycles = 0; u8* opcode_start; while (true) { opcode_start = src.GetPointer(); if (!src.size()) goto end; const u8 cmd_byte = src.Read(); int refarray; switch (cmd_byte) { case GX_NOP: total_cycles += 6; // Hm, this means that we scan over nop streams pretty slowly... break; case GX_UNKNOWN_RESET: total_cycles += 6; // Datel software uses this command DEBUG_LOG(VIDEO, "GX Reset?: %08x", cmd_byte); break; case GX_LOAD_CP_REG: { if (src.size() < 1 + 4) goto end; total_cycles += 12; const u8 sub_cmd = src.Read(); const u32 value = src.Read(); LoadCPReg(sub_cmd, value, is_preprocess); if (!is_preprocess) INCSTAT(g_stats.this_frame.num_cp_loads); } break; case GX_LOAD_XF_REG: { if (src.size() < 4) goto end; const u32 cmd2 = src.Read(); const int transfer_size = ((cmd2 >> 16) & 15) + 1; if (src.size() < transfer_size * sizeof(u32)) goto end; total_cycles += 18 + 6 * transfer_size; if (!is_preprocess) { const u32 xf_address = cmd2 & 0xFFFF; LoadXFReg(transfer_size, xf_address, src); INCSTAT(g_stats.this_frame.num_xf_loads); } src.Skip(transfer_size); } break; case GX_LOAD_INDX_A: // used for position matrices refarray = 0xC; goto load_indx; case GX_LOAD_INDX_B: // used for normal matrices refarray = 0xD; goto load_indx; case GX_LOAD_INDX_C: // used for postmatrices refarray = 0xE; goto load_indx; case GX_LOAD_INDX_D: // used for lights refarray = 0xF; goto load_indx; load_indx: if (src.size() < 4) goto end; total_cycles += 6; if (is_preprocess) PreprocessIndexedXF(src.Read(), refarray); else LoadIndexedXF(src.Read(), refarray); break; case GX_CMD_CALL_DL: { if (src.size() < 8) goto end; const u32 address = src.Read(); const u32 count = src.Read(); if (in_display_list) { total_cycles += 6; INFO_LOG(VIDEO, "recursive display list detected"); } else { if (is_preprocess) InterpretDisplayListPreprocess(address, count); else total_cycles += 6 + InterpretDisplayList(address, count); } } break; case GX_CMD_UNKNOWN_METRICS: // zelda 4 swords calls it and checks the metrics registers after // that total_cycles += 6; DEBUG_LOG(VIDEO, "GX 0x44: %08x", cmd_byte); break; case GX_CMD_INVL_VC: // Invalidate Vertex Cache total_cycles += 6; DEBUG_LOG(VIDEO, "Invalidate (vertex cache?)"); break; case GX_LOAD_BP_REG: // In skipped_frame case: We have to let BP writes through because they set // tokens and stuff. TODO: Call a much simplified LoadBPReg instead. { if (src.size() < 4) goto end; total_cycles += 12; const u32 bp_cmd = src.Read(); if (is_preprocess) { LoadBPRegPreprocess(bp_cmd); } else { LoadBPReg(bp_cmd); INCSTAT(g_stats.this_frame.num_bp_loads); } } break; // draw primitives default: if ((cmd_byte & 0xC0) == 0x80) { // load vertices if (src.size() < 2) goto end; const u16 num_vertices = src.Read(); const int bytes = VertexLoaderManager::RunVertices( cmd_byte & GX_VAT_MASK, // Vertex loader index (0 - 7) (cmd_byte & GX_PRIMITIVE_MASK) >> GX_PRIMITIVE_SHIFT, num_vertices, src, is_preprocess); if (bytes < 0) goto end; src.Skip(bytes); // 4 GPU ticks per vertex, 3 CPU ticks per GPU tick total_cycles += num_vertices * 4 * 3 + 6; } else { if (!s_is_fifo_error_seen) CommandProcessor::HandleUnknownOpcode(cmd_byte, opcode_start, is_preprocess); ERROR_LOG(VIDEO, "FIFO: Unknown Opcode(0x%02x @ %p, preprocessing = %s)", cmd_byte, opcode_start, is_preprocess ? "yes" : "no"); s_is_fifo_error_seen = true; total_cycles += 1; } break; } // Display lists get added directly into the FIFO stream if (!is_preprocess && g_bRecordFifoData && cmd_byte != GX_CMD_CALL_DL) { const u8* const opcode_end = src.GetPointer(); FifoRecorder::GetInstance().WriteGPCommand(opcode_start, u32(opcode_end - opcode_start)); } } end: if (cycles) { *cycles = total_cycles; } return opcode_start; } template u8* Run(DataReader src, u32* cycles, bool in_display_list); template u8* Run(DataReader src, u32* cycles, bool in_display_list); } // namespace OpcodeDecoder