#include "_vmem.h"
#include "hw/aica/aica_if.h"
#include "hw/pvr/pvr_mem.h"
#include "hw/pvr/elan.h"
#include "hw/sh4/dyna/blockmanager.h"
#include "hw/sh4/sh4_mem.h"
#include "oslib/oslib.h"

#define HANDLER_MAX 0x1F
#define HANDLER_COUNT (HANDLER_MAX+1)

//top registered handler
static _vmem_handler _vmem_lrp;

//handler tables
static _vmem_ReadMem8FP*   _vmem_RF8[HANDLER_COUNT];
static _vmem_WriteMem8FP*  _vmem_WF8[HANDLER_COUNT];

static _vmem_ReadMem16FP*  _vmem_RF16[HANDLER_COUNT];
static _vmem_WriteMem16FP* _vmem_WF16[HANDLER_COUNT];

static _vmem_ReadMem32FP*  _vmem_RF32[HANDLER_COUNT];
static _vmem_WriteMem32FP* _vmem_WF32[HANDLER_COUNT];

//lookup table indexed by the upper 8 bits of the address:
//each entry is either an adjusted block pointer (with the mirroring shift in its low bits)
//or a small handler id (<= HANDLER_MAX)
static void* _vmem_MemInfo_ptr[0x100];

#define MAP_RAM_START_OFFSET  0
#define MAP_VRAM_START_OFFSET (MAP_RAM_START_OFFSET+RAM_SIZE)
#define MAP_ARAM_START_OFFSET (MAP_VRAM_START_OFFSET+VRAM_SIZE)
#define MAP_ERAM_START_OFFSET (MAP_ARAM_START_OFFSET+ARAM_SIZE)

void* _vmem_read_const(u32 addr,bool& ismem,u32 sz)
{
	u32 page=addr>>24;
	unat iirf=(unat)_vmem_MemInfo_ptr[page];
	void* ptr=(void*)(iirf&~HANDLER_MAX);

	if (ptr==0)
	{
		ismem=false;
		const unat id=iirf;
		if (sz==1)
		{
			return (void*)_vmem_RF8[id];
		}
		else if (sz==2)
		{
			return (void*)_vmem_RF16[id];
		}
		else if (sz==4)
		{
			return (void*)_vmem_RF32[id];
		}
		else
		{
			die("Invalid size");
			return nullptr;
		}
	}
	else
	{
		ismem=true;
		addr<<=iirf;
		addr>>=iirf;

		return &(((u8*)ptr)[addr]);
	}
}

void* _vmem_write_const(u32 addr,bool& ismem,u32 sz)
{
	u32 page=addr>>24;
	unat iirf=(unat)_vmem_MemInfo_ptr[page];
	void* ptr=(void*)(iirf&~HANDLER_MAX);

	if (ptr==0)
	{
		ismem=false;
		const unat id=iirf;
		if (sz==1)
		{
			return (void*)_vmem_WF8[id];
		}
		else if (sz==2)
		{
			return (void*)_vmem_WF16[id];
		}
		else if (sz==4)
		{
			return (void*)_vmem_WF32[id];
		}
		else
		{
			die("Invalid size");
			return nullptr;
		}
	}
	else
	{
		ismem=true;
		addr<<=iirf;
		addr>>=iirf;

		return &(((u8*)ptr)[addr]);
	}
}

template<typename T, typename Trv>
Trv DYNACALL _vmem_readt(u32 addr)
{
	constexpr u32 sz = sizeof(T);

	u32 page=addr>>24;	//1 op, shift/extract
	unat iirf=(unat)_vmem_MemInfo_ptr[page];	//2 ops, insert + read [vmem table will be on reg]
	void* ptr=(void*)(iirf&~HANDLER_MAX);	//2 ops, and // 1 op insert

	if (likely(ptr!=0))
	{
		addr<<=iirf;
		addr>>=iirf;

		T data=(*((T*)&(((u8*)ptr)[addr])));
		return data;
	}
	else
	{
		const u32 id=iirf;
		if (sz==1)
		{
			return (T)_vmem_RF8[id](addr);
		}
		else if (sz==2)
		{
			return (T)_vmem_RF16[id](addr);
		}
		else if (sz==4)
		{
			return _vmem_RF32[id](addr);
		}
		else if (sz==8)
		{
			T rv=_vmem_RF32[id](addr);
			rv|=(T)((u64)_vmem_RF32[id](addr+4)<<32);

			return rv;
		}
		else
		{
			die("Invalid size");
			return 0;
		}
	}
}
template u8 DYNACALL _vmem_readt<u8, u8>(u32 addr);
template u16 DYNACALL _vmem_readt<u16, u16>(u32 addr);
template u32 DYNACALL _vmem_readt<u32, u32>(u32 addr);
template u64 DYNACALL _vmem_readt<u64, u64>(u32 addr);

template<typename T>
void DYNACALL _vmem_writet(u32 addr, T data)
{
	constexpr u32 sz = sizeof(T);

	u32 page=addr>>24;
	unat iirf=(unat)_vmem_MemInfo_ptr[page];
	void* ptr=(void*)(iirf&~HANDLER_MAX);

	if (likely(ptr!=0))
	{
		addr<<=iirf;
		addr>>=iirf;

		*((T*)&(((u8*)ptr)[addr]))=data;
	}
	else
	{
		const u32 id=iirf;
		if (sz==1)
		{
			_vmem_WF8[id](addr,data);
		}
		else if (sz==2)
		{
			_vmem_WF16[id](addr,data);
		}
		else if (sz==4)
		{
			_vmem_WF32[id](addr,data);
		}
		else if (sz==8)
		{
			_vmem_WF32[id](addr,(u32)data);
			_vmem_WF32[id](addr+4,(u32)((u64)data>>32));
		}
		else
		{
			die("Invalid size");
		}
	}
}
template void DYNACALL _vmem_writet<u8>(u32 addr, u8 data);
template void DYNACALL _vmem_writet<u16>(u32 addr, u16 data);
template void DYNACALL _vmem_writet<u32>(u32 addr, u32 data);
template void DYNACALL _vmem_writet<u64>(u32 addr, u64 data);
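// Helper used by _vmem_map_block() below: the low bits of each lookup-table entry hold the
// shift amount that folds a full 32-bit address back into the block's mask (the addr<<=iirf;
// addr>>=iirf; sequence in the accessors above). FindMask() is referenced but not shown in
// this excerpt; a minimal sketch, assuming it returns the number of leading address bits not
// covered by the mask (e.g. FindMask(0x00FFFFFF) == 8):
static u32 FindMask(u32 mask)
{
	u32 shift = 0;
	while (mask != (0xFFFFFFFFu >> shift))
		shift++;

	return shift;
}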
//ReadMem/WriteMem functions
//ReadMem
u32 DYNACALL _vmem_ReadMem8SX32(u32 Address) { return _vmem_readt<s8, u32>(Address); }
u32 DYNACALL _vmem_ReadMem16SX32(u32 Address) { return _vmem_readt<s16, u32>(Address); }

u8 DYNACALL _vmem_ReadMem8(u32 Address) { return _vmem_readt<u8, u8>(Address); }
u16 DYNACALL _vmem_ReadMem16(u32 Address) { return _vmem_readt<u16, u16>(Address); }
u32 DYNACALL _vmem_ReadMem32(u32 Address) { return _vmem_readt<u32, u32>(Address); }
u64 DYNACALL _vmem_ReadMem64(u32 Address) { return _vmem_readt<u64, u64>(Address); }

//WriteMem
void DYNACALL _vmem_WriteMem8(u32 Address,u8 data) { _vmem_writet<u8>(Address,data); }
void DYNACALL _vmem_WriteMem16(u32 Address,u16 data) { _vmem_writet<u16>(Address,data); }
void DYNACALL _vmem_WriteMem32(u32 Address,u32 data) { _vmem_writet<u32>(Address,data); }
void DYNACALL _vmem_WriteMem64(u32 Address,u64 data) { _vmem_writet<u64>(Address,data); }

#define MEM_ERROR_RETURN_VALUE 0

//default read handlers
static u8 DYNACALL _vmem_ReadMem8_not_mapped(u32 address)
{
	INFO_LOG(MEMORY, "[sh4]Read8 from 0x%X, not mapped [_vmem default handler]", address);
	return (u8)MEM_ERROR_RETURN_VALUE;
}
static u16 DYNACALL _vmem_ReadMem16_not_mapped(u32 address)
{
	INFO_LOG(MEMORY, "[sh4]Read16 from 0x%X, not mapped [_vmem default handler]", address);
	return (u16)MEM_ERROR_RETURN_VALUE;
}
static u32 DYNACALL _vmem_ReadMem32_not_mapped(u32 address)
{
	INFO_LOG(MEMORY, "[sh4]Read32 from 0x%X, not mapped [_vmem default handler]", address);
	return (u32)MEM_ERROR_RETURN_VALUE;
}

//default write handlers
static void DYNACALL _vmem_WriteMem8_not_mapped(u32 address,u8 data)
{
	INFO_LOG(MEMORY, "[sh4]Write8 to 0x%X=0x%X, not mapped [_vmem default handler]", address, data);
}
static void DYNACALL _vmem_WriteMem16_not_mapped(u32 address,u16 data)
{
	INFO_LOG(MEMORY, "[sh4]Write16 to 0x%X=0x%X, not mapped [_vmem default handler]", address, data);
}
static void DYNACALL _vmem_WriteMem32_not_mapped(u32 address,u32 data)
{
	INFO_LOG(MEMORY, "[sh4]Write32 to 0x%X=0x%X, not mapped [_vmem default handler]", address, data);
}

//code to register handlers
//0 is considered error :)
_vmem_handler _vmem_register_handler(
		_vmem_ReadMem8FP* read8,
		_vmem_ReadMem16FP* read16,
		_vmem_ReadMem32FP* read32,

		_vmem_WriteMem8FP* write8,
		_vmem_WriteMem16FP* write16,
		_vmem_WriteMem32FP* write32)
{
	_vmem_handler rv=_vmem_lrp++;

	verify(rv<HANDLER_COUNT);

	//null callbacks fall back to the default "not mapped" handlers
	_vmem_RF8[rv] =read8==0   ? _vmem_ReadMem8_not_mapped   : read8;
	_vmem_RF16[rv]=read16==0  ? _vmem_ReadMem16_not_mapped  : read16;
	_vmem_RF32[rv]=read32==0  ? _vmem_ReadMem32_not_mapped  : read32;

	_vmem_WF8[rv] =write8==0  ? _vmem_WriteMem8_not_mapped  : write8;
	_vmem_WF16[rv]=write16==0 ? _vmem_WriteMem16_not_mapped : write16;
	_vmem_WF32[rv]=write32==0 ? _vmem_WriteMem32_not_mapped : write32;

	return rv;
}

//map a registered handler to a mem region
void _vmem_map_handler(_vmem_handler Handler,u32 start,u32 end)
{
	verify(start<0x100);
	verify(end<0x100);
	verify(start<=end);

	for (u32 i=start;i<=end;i++)
	{
		//store the handler id in the entry (pointer part stays null)
		_vmem_MemInfo_ptr[i] = (u8*)nullptr + Handler;
	}
}

//map a memory block to a mem region
void _vmem_map_block(void* base,u32 start,u32 end,u32 mask)
{
	verify(start<0x100);
	verify(end<0x100);
	verify(start<=end);
	verify((0xFF & (unat)base)==0);
	verify(base!=0);

	u32 j=0;
	for (u32 i=start;i<=end;i++)
	{
		_vmem_MemInfo_ptr[i]=&(((u8*)base)[j&mask]) + FindMask(mask) - (j & mask);
		j+=0x1000000;
	}
}

void _vmem_mirror_mapping(u32 new_region,u32 start,u32 size)
{
	u32 end=start+size-1;
	verify(start<0x100);
	verify(end<0x100);
	verify(start<=end);
	verify(!((start>=new_region) && (end<=new_region)));

	u32 j=new_region;
	for (u32 i=start;i<=end;i++)
	{
		_vmem_MemInfo_ptr[j&0xFF]=_vmem_MemInfo_ptr[i&0xFF];
		j++;
	}
}

//init/reset/term
void _vmem_init()
{
	//clear read tables
	memset(_vmem_RF8,0,sizeof(_vmem_RF8));
	memset(_vmem_RF16,0,sizeof(_vmem_RF16));
	memset(_vmem_RF32,0,sizeof(_vmem_RF32));

	//clear write tables
	memset(_vmem_WF8,0,sizeof(_vmem_WF8));
	memset(_vmem_WF16,0,sizeof(_vmem_WF16));
	memset(_vmem_WF32,0,sizeof(_vmem_WF32));

	//clear meminfo table
	memset(_vmem_MemInfo_ptr,0,sizeof(_vmem_MemInfo_ptr));

	//reset registration index
	_vmem_lrp=0;

	//register default functions (0) for slot 0
	_vmem_handler defaultHandler = _vmem_register_handler(0,0,0,0,0,0);
	verify(defaultHandler == 0);
}
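// Illustrative sketch only (hypothetical device, excluded from the build): how a
// memory-mapped device would plug into the tables above. Callbacks passed as null fall
// back to the *_not_mapped defaults, and _vmem_map_handler() routes one or more 16MB pages
// (selected by the upper 8 address bits) to the returned handler id.
#if 0
static u32 DYNACALL ExampleDevice_Read32(u32 addr) { return 0; }
static void DYNACALL ExampleDevice_Write32(u32 addr, u32 data) { }

static void ExampleDevice_Init()
{
	//register 32-bit accessors only; 8/16-bit accesses hit the default handlers
	_vmem_handler handler = _vmem_register_handler(nullptr, nullptr, ExampleDevice_Read32,
	                                               nullptr, nullptr, ExampleDevice_Write32);
	//route addresses 0x1F000000-0x1FFFFFFF (page 0x1F) to this device
	_vmem_map_handler(handler, 0x1F, 0x1F);
}
#endif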
void _vmem_term()
{
}

u8* virt_ram_base;
static bool vmemAvailable = false;

static void *malloc_pages(size_t size)
{
	return allocAligned(PAGE_SIZE, size);
}

static void free_pages(void *p)
{
	freeAligned(p);
}

#if FEAT_SHREC != DYNAREC_NONE
// Resets the FPCB table (by either clearing it to the default value,
// or by flushing it and making it fault on access again).
void _vmem_bm_reset()
{
	// If we allocated it via vmem:
	if (virt_ram_base)
		vmem_platform_reset_mem(p_sh4rcb->fpcb, sizeof(p_sh4rcb->fpcb));
	else
		// We allocated it via a regular malloc/new/whatever on the heap
		bm_vmem_pagefill((void**)p_sh4rcb->fpcb, sizeof(p_sh4rcb->fpcb));
}

// This gets called whenever there is a pagefault. It is possible that it lands on the
// fpcb memory range, which is allocated on miss. Returning true tells the fault handler
// that this was us, that the page is now resolved, and that execution can continue.
bool BM_LockedWrite(u8* address)
{
	if (!virt_ram_base)
		return false;	// No vmem, therefore it wasn't us who caused this.

	uintptr_t ptrint = (uintptr_t)address;
	uintptr_t start = (uintptr_t)p_sh4rcb->fpcb;
	uintptr_t end = start + sizeof(p_sh4rcb->fpcb);

	if (ptrint >= start && ptrint < end)
	{
		// Alloc the page then, and initialize it to default values
		void *aligned_addr = (void*)(ptrint & (~PAGE_MASK));
		vmem_platform_ondemand_page(aligned_addr, PAGE_SIZE);
		bm_vmem_pagefill((void**)aligned_addr, PAGE_SIZE);

		return true;
	}
	return false;
}
#endif

bool _vmem_reserve()
{
	static_assert((sizeof(Sh4RCB) % PAGE_SIZE) == 0, "sizeof(Sh4RCB) not multiple of PAGE_SIZE");

	if (vmemAvailable)
		return true;

	// Use vmem only if settings mandate so, and if we have proper exception handlers.
#if !defined(TARGET_NO_EXCEPTIONS)
	if (!settings.dynarec.disable_nvmem)
		vmemAvailable = vmem_platform_init((void**)&virt_ram_base, (void**)&p_sh4rcb,
				RAM_SIZE_MAX + VRAM_SIZE_MAX + ARAM_SIZE_MAX + elan::ERAM_SIZE_MAX);
#endif
	return true;
}

static void _vmem_term_mappings()
{
	if (!vmemAvailable)
	{
		free_pages(p_sh4rcb);
		p_sh4rcb = nullptr;
		free_pages(mem_b.data);
		mem_b.data = nullptr;
		free_pages(vram.data);
		vram.data = nullptr;
		free_pages(aica_ram.data);
		aica_ram.data = nullptr;
		free_pages(elan::RAM);
		elan::RAM = nullptr;
	}
}
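// Illustrative sketch only (hypothetical platform glue, excluded from the build): the
// platform fault handler is expected to give BM_LockedWrite() first chance at a write
// fault before treating it as a locked-VRAM write or a real crash. VramLockedWrite is
// assumed here as the texture-cache fallback.
#if 0
static bool ExampleHandleAccessFault(u8 *fault_address)
{
#if FEAT_SHREC != DYNAREC_NONE
	if (BM_LockedWrite(fault_address))
		return true;	// on-demand FPCB page, now mapped and filled
#endif
	return VramLockedWrite(fault_address);	// assumed: forward to the texture cache
}
#endif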
void _vmem_init_mappings()
{
	_vmem_term_mappings();

	// Fallback to statically allocated buffers; this results in slow-ops being generated.
	if (!vmemAvailable)
	{
		WARN_LOG(VMEM, "Warning! nvmem is DISABLED (due to failure or not being built in)");
		virt_ram_base = nullptr;

		// Allocate it all and initialize it.
		p_sh4rcb = (Sh4RCB*)malloc_pages(sizeof(Sh4RCB));
#if FEAT_SHREC != DYNAREC_NONE
		bm_vmem_pagefill((void**)p_sh4rcb->fpcb, sizeof(p_sh4rcb->fpcb));
#endif
		memset(&p_sh4rcb->cntx, 0, sizeof(p_sh4rcb->cntx));

		mem_b.size = RAM_SIZE;
		mem_b.data = (u8*)malloc_pages(RAM_SIZE);

		vram.size = VRAM_SIZE;
		vram.data = (u8*)malloc_pages(VRAM_SIZE);

		aica_ram.size = ARAM_SIZE;
		aica_ram.data = (u8*)malloc_pages(ARAM_SIZE);

		elan::RAM = (u8*)malloc_pages(elan::ERAM_SIZE);
	}
	else
	{
		NOTICE_LOG(VMEM, "Info: nvmem is enabled");
		INFO_LOG(VMEM, "Info: p_sh4rcb: %p virt_ram_base: %p", p_sh4rcb, virt_ram_base);

		// Map the different parts of the memory file into the new memory range we got.
		const vmem_mapping mem_mappings[] = {
			{0x00000000, 0x00800000,                      0,               0, false},	// Area 0 -> unused
			{0x00800000, 0x01000000, MAP_ARAM_START_OFFSET,       ARAM_SIZE, false},	// Aica
			{0x01000000, 0x04000000,                      0,               0, false},	// More unused
			{0x04000000, 0x05000000, MAP_VRAM_START_OFFSET,       VRAM_SIZE, true},	// Area 1 (vram, 16MB, wrapped on DC as 2x8MB)
			{0x05000000, 0x06000000,                      0,               0, false},	// 32 bit path (unused)
			{0x06000000, 0x07000000, MAP_VRAM_START_OFFSET,       VRAM_SIZE, true},	// VRAM mirror
			{0x07000000, 0x08000000,                      0,               0, false},	// 32 bit path (unused) mirror
			{0x08000000, 0x0A000000,                      0,               0, false},	// Area 2
			{0x0A000000, 0x0C000000, MAP_ERAM_START_OFFSET, elan::ERAM_SIZE, true},	// Area 2 (Elan RAM)
			{0x0C000000, 0x10000000,  MAP_RAM_START_OFFSET,        RAM_SIZE, true},	// Area 3 (main RAM + 3 mirrors)
			{0x10000000, 0x20000000,                      0,               0, false},	// Area 4-7 (unused)
			// This is outside of the 512MB addr space. We map 8MB in all cases to help some games that read past the end of aica ram
			{0x20000000, 0x20800000, MAP_ARAM_START_OFFSET,       ARAM_SIZE, true},	// writable aica ram
		};
		vmem_platform_create_mappings(&mem_mappings[0], ARRAY_SIZE(mem_mappings));

		// Point buffers to actual data pointers
		aica_ram.data = &virt_ram_base[0x20000000];	// Points to the writable AICA addrspace
		vram.data     = &virt_ram_base[0x04000000];	// Points to first vram mirror (writable and lockable)
		mem_b.data    = &virt_ram_base[0x0C000000];	// Main memory, first mirror
		elan::RAM     = &virt_ram_base[0x0A000000];

		aica_ram.size = ARAM_SIZE;
		vram.size     = VRAM_SIZE;
		mem_b.size    = RAM_SIZE;
	}

	// Clear out memory
	aica_ram.Zero();
	vram.Zero();
	mem_b.Zero();

	NOTICE_LOG(VMEM, "BASE %p RAM(%d MB) %p VRAM64(%d MB) %p ARAM(%d MB) %p",
			virt_ram_base,
			RAM_SIZE / 1024 / 1024, mem_b.data,
			VRAM_SIZE / 1024 / 1024, vram.data,
			ARAM_SIZE / 1024 / 1024, aica_ram.data);
}

void _vmem_release()
{
	if (virt_ram_base)
	{
		vmem_platform_destroy();
		virt_ram_base = nullptr;
	}
	else
	{
		_vmem_unprotect_vram(0, VRAM_SIZE);
		_vmem_term_mappings();
	}
	vmemAvailable = false;
}

void _vmem_protect_vram(u32 addr, u32 size)
{
	addr &= VRAM_MASK;
	if (_nvmem_enabled())
	{
		mem_region_lock(virt_ram_base + 0x04000000 + addr, size);		// P0
		//mem_region_lock(virt_ram_base + 0x06000000 + addr, size);		// P0 - mirror
		if (VRAM_SIZE == 0x800000)
		{
			// wraps when only 8MB VRAM
			mem_region_lock(virt_ram_base + 0x04000000 + addr + VRAM_SIZE, size);	// P0 wrap
			//mem_region_lock(virt_ram_base + 0x06000000 + addr + VRAM_SIZE, size);	// P0 mirror wrap
		}
	}
	else
	{
		mem_region_lock(&vram[addr], size);
	}
}

void _vmem_unprotect_vram(u32 addr, u32 size)
{
	addr &= VRAM_MASK;
	if (_nvmem_enabled())
	{
		mem_region_unlock(virt_ram_base + 0x04000000 + addr, size);		// P0
		//mem_region_unlock(virt_ram_base + 0x06000000 + addr, size);		// P0 - mirror
		if (VRAM_SIZE == 0x800000)
		{
			// wraps when only 8MB VRAM
			mem_region_unlock(virt_ram_base + 0x04000000 + addr + VRAM_SIZE, size);	// P0 wrap
			//mem_region_unlock(virt_ram_base + 0x06000000 + addr + VRAM_SIZE, size);	// P0 mirror wrap
		}
	}
	else
	{
		mem_region_unlock(&vram[addr], size);
	}
}

u32 _vmem_get_vram_offset(void *addr)
{
	if (_nvmem_enabled())
	{
		ptrdiff_t offset = (u8*)addr - virt_ram_base;
		if (offset < 0 || offset >= 0x20000000)
			return -1;
		if ((offset >> 24) != 4)
			return -1;

		return offset & VRAM_MASK;
	}
	else
	{
		ptrdiff_t offset = (u8*)addr - &vram[0];
		if (offset < 0 || offset >= VRAM_SIZE)
			return -1;

		return (u32)offset;
	}
}
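// Illustrative sketch only (hypothetical caller, excluded from the build): the intended
// pairing of _vmem_protect_vram()/_vmem_get_vram_offset() in a write-fault path, where a
// faulting host pointer is translated back to a VRAM offset and the page is unprotected
// before the write is retried.
#if 0
static bool ExampleVramWriteFault(void *fault_address)
{
	u32 offset = _vmem_get_vram_offset(fault_address);
	if (offset == (u32)-1)
		return false;	// fault is not inside a VRAM mapping

	// unlock the whole page so the pending write (and later ones) can proceed,
	// then mark any textures cached from that page as dirty (not shown here)
	_vmem_unprotect_vram(offset & ~PAGE_MASK, PAGE_SIZE);
	return true;
}
#endif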