/* * Glide64 - Glide video plugin for Nintendo 64 emulators. * Copyright (c) 2002 Dave2001 * Copyright (c) 2003-2009 Sergey 'Gonetz' Lipski * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ //**************************************************************** // // Glide64 - Glide Plugin for Nintendo 64 emulators // Project started on December 29th, 2001 // // Authors: // Dave2001, original author, founded the project in 2001, left it in 2002 // Gugaman, joined the project in 2002, left it in 2002 // Sergey 'Gonetz' Lipski, joined the project in 2002, main author since fall of 2002 // Hiroshi 'KoolSmoky' Morii, joined the project in 2007 // //**************************************************************** // // To modify Glide64: // * Write your name and (optional)email, commented by your work, so I know who did it, and so that you can find which parts you modified when it comes time to send it to me. // * Do NOT send me the whole project or file that you modified. Take out your modified code sections, and tell me where to put them. If people sent the whole thing, I would have many different versions, but no idea how to combine them all. // //**************************************************************** #include "Gfx_1.3.h" #include "TexCache.h" #include "Combine.h" #include "Util.h" #include #include void LoadTex(int id, int tmu); uint8_t tex1[1024 * 1024 * 4]; // temporary texture uint8_t tex2[1024 * 1024 * 4]; uint8_t *texture; uint8_t *texture_buffer = tex1; #include "TexLoad.h" // texture loading functions, ONLY INCLUDE IN THIS FILE!!! #include "MiClWr32b.h" #include "MiClWr16b.h" // Mirror/Clamp/Wrap functions, ONLY INCLUDE IN THIS FILE!!! #include "MiClWr8b.h" // Mirror/Clamp/Wrap functions, ONLY INCLUDE IN THIS FILE!!! #include "TexConv.h" // texture conversions, ONLY INCLUDE IN THIS FILE!!! #include "TexMod.h" #include "TexModCI.h" #include "CRC.h" #ifdef TEXTURE_FILTER // Hiroshi Morii extern int ghq_dmptex_toggle_key; #endif typedef struct TEXINFO_t { int real_image_width, real_image_height; // FOR ALIGNMENT PURPOSES ONLY!!! int tile_width, tile_height; int mask_width, mask_height; int width, height; int wid_64, line; uint32_t crc; uint32_t flags; int splits, splitheight; #ifdef TEXTURE_FILTER uint64 ricecrc; #endif } TEXINFO; TEXINFO texinfo[2]; int tex_found[2][MAX_TMU]; #ifdef TEXTURE_FILTER typedef struct HIRESTEX_t { int width, height; uint16_t format; uint8_t *data; } HIRESTEX; #endif //**************************************************************** // List functions typedef struct NODE_t { uint32_t crc; uintptr_t data; int tmu; int number; NODE_t *pNext; } NODE; NODE *cachelut[65536]; void AddToList(NODE **list, uint32_t crc, uintptr_t data, int tmu, int number) { NODE *node = new NODE; node->crc = crc; node->data = data; node->tmu = tmu; node->number = number; node->pNext = *list; *list = node; rdp.n_cached[tmu] ++; if (voodoo.tex_UMA) rdp.n_cached[tmu ^ 1] = rdp.n_cached[tmu]; } void DeleteList(NODE **list) { while (*list) { NODE *next = (*list)->pNext; delete (*list); *list = next; } } void TexCacheInit() { for (int i = 0; i < 65536; i++) { cachelut[i] = NULL; } } //**************************************************************** // ClearCache - clear the texture cache for BOTH tmus void ClearCache() { voodoo.tmem_ptr[0] = offset_textures; rdp.n_cached[0] = 0; voodoo.tmem_ptr[1] = voodoo.tex_UMA ? offset_textures : offset_texbuf1; rdp.n_cached[1] = 0; for (int i = 0; i < 65536; i++) { DeleteList(&cachelut[i]); } } //**************************************************************** uint32_t textureCRC(uint8_t *addr, int width, int height, int line) { uint32_t crc = 0; uint32_t *pixelpos; unsigned int i; uint64_t twopixel_crc; pixelpos = (uint32_t*)addr; for (; height; height--) { for (i = width; i; --i) { twopixel_crc = i * (uint64_t)(pixelpos[1] + pixelpos[0] + crc); crc = (uint32_t)(((twopixel_crc >> 32) + twopixel_crc) & 0xFFFFFFFF); pixelpos += 2; } crc = ((unsigned int)height * (uint64_t)crc >> 32) + height * crc; pixelpos = (uint32_t *)((char *)pixelpos + line); } return crc; } // GetTexInfo - gets information for either t0 or t1, checks if in cache & fills tex_found void GetTexInfo(int id, int tile) { WriteTrace(TraceRDP, TraceDebug, " | |-+ GetTexInfo (id: %d, tile: %d)", id, tile); // this is the NEW cache searching, searches only textures with similar crc's int t; for (t = 0; t < MAX_TMU; t++) tex_found[id][t] = -1; TBUFF_COLOR_IMAGE * pFBTex = 0; if (rdp.aTBuffTex[0] && rdp.aTBuffTex[0]->tile == id) pFBTex = rdp.aTBuffTex[0]; else if (rdp.aTBuffTex[1] && rdp.aTBuffTex[1]->tile == id) pFBTex = rdp.aTBuffTex[1]; if (pFBTex && pFBTex->cache) return; TEXINFO *info = &texinfo[id]; int tile_width, tile_height; int mask_width, mask_height; int width, height; int wid_64, line, bpl; // Get width and height tile_width = rdp.tiles[tile].lr_s - rdp.tiles[tile].ul_s + 1; tile_height = rdp.tiles[tile].lr_t - rdp.tiles[tile].ul_t + 1; mask_width = (rdp.tiles[tile].mask_s == 0) ? (tile_width) : (1 << rdp.tiles[tile].mask_s); mask_height = (rdp.tiles[tile].mask_t == 0) ? (tile_height) : (1 << rdp.tiles[tile].mask_t); if (g_settings->alt_tex_size) { // ** ALTERNATE TEXTURE SIZE METHOD ** // Helps speed in some games that loaded weird-sized textures, but could break other // textures. // Get the width/height to load if ((rdp.tiles[tile].clamp_s && tile_width <= 256) || (mask_width > 256)) { // loading width width = minval(mask_width, tile_width); // actual width rdp.tiles[tile].width = tile_width; } else { // wrap all the way width = minval(mask_width, tile_width); // changed from mask_width only rdp.tiles[tile].width = width; } if ((rdp.tiles[tile].clamp_t && tile_height <= 256) || (mask_height > 256)) { // loading height height = minval(mask_height, tile_height); // actual height rdp.tiles[tile].height = tile_height; } else { // wrap all the way height = minval(mask_height, tile_height); rdp.tiles[tile].height = height; } } else { // ** NORMAL TEXTURE SIZE METHOD ** // This is the 'correct' method for determining texture size, but may cause certain // textures to load too large & make the whole game go slow. if (mask_width > 256 && mask_height > 256) { mask_width = tile_width; mask_height = tile_height; } // Get the width/height to load if ((rdp.tiles[tile].clamp_s && tile_width <= 256))//|| (mask_width > 256)) { // loading width width = minval(mask_width, tile_width); // actual width rdp.tiles[tile].width = tile_width; } else { // wrap all the way width = mask_width; rdp.tiles[tile].width = mask_width; } if ((rdp.tiles[tile].clamp_t && tile_height <= 256) || (mask_height > 256)) { // loading height height = minval(mask_height, tile_height); // actual height rdp.tiles[tile].height = tile_height; } else { // wrap all the way height = mask_height; rdp.tiles[tile].height = mask_height; } } // without any large texture fixing-up; for alignment int real_image_width = rdp.tiles[tile].width; int real_image_height = rdp.tiles[tile].height; int crc_height = height; if (rdp.timg.set_by == 1) crc_height = tile_height; bpl = width << rdp.tiles[tile].size >> 1; // ** COMMENT THIS TO DISABLE LARGE TEXTURES #ifdef LARGE_TEXTURE_HANDLING if (!voodoo.sup_large_tex && width > 256) { info->splits = ((width - 1) >> 8) + 1; info->splitheight = rdp.tiles[tile].height; rdp.tiles[tile].height *= info->splits; rdp.tiles[tile].width = 256; width = 256; } else #endif // ** { info->splits = 1; } WriteTrace(TraceRDP, TraceDebug, " | | |-+ Texture approved:"); WriteTrace(TraceRDP, TraceDebug, " | | | |- tmem: %08lx", rdp.tiles[tile].t_mem); WriteTrace(TraceRDP, TraceDebug, " | | | |- load width: %d", width); WriteTrace(TraceRDP, TraceDebug, " | | | |- load height: %d", height); WriteTrace(TraceRDP, TraceDebug, " | | | |- actual width: %d", rdp.tiles[tile].width); WriteTrace(TraceRDP, TraceDebug, " | | | |- actual height: %d", rdp.tiles[tile].height); WriteTrace(TraceRDP, TraceDebug, " | | | |- size: %d", rdp.tiles[tile].size); WriteTrace(TraceRDP, TraceDebug, " | | | +- format: %d", rdp.tiles[tile].format); WriteTrace(TraceRDP, TraceDebug, " | | |- Calculating CRC... "); // ** CRC CHECK wid_64 = width << (rdp.tiles[tile].size) >> 1; if (rdp.tiles[tile].size == 3) { if (wid_64 & 15) wid_64 += 16; wid_64 &= 0xFFFFFFF0; } else { if (wid_64 & 7) wid_64 += 8; // round up } wid_64 = wid_64 >> 3; // Texture too big for tmem & needs to wrap? (trees in mm) if (rdp.tiles[tile].t_mem + minval(height, tile_height) * (rdp.tiles[tile].line << 3) > 4096) { WriteTrace(TraceRDP, TraceDebug, "TEXTURE WRAPS TMEM!!! "); // calculate the y value that intersects at 4096 bytes int y = (4096 - rdp.tiles[tile].t_mem) / (rdp.tiles[tile].line << 3); rdp.tiles[tile].clamp_t = 0; rdp.tiles[tile].lr_t = rdp.tiles[tile].ul_t + y - 1; // calc mask int shift; for (shift = 0; (1 << shift) < y; shift++); rdp.tiles[tile].mask_t = shift; // restart the function WriteTrace(TraceRDP, TraceDebug, "restarting..."); GetTexInfo(id, tile); return; } line = rdp.tiles[tile].line; if (rdp.tiles[tile].size == 3) line <<= 1; uint32_t crc = 0; if (g_settings->fast_crc) { line = (line - wid_64) << 3; if (wid_64 < 1) wid_64 = 1; uint8_t * addr = (((uint8_t*)rdp.tmem) + (rdp.tiles[tile].t_mem << 3)); if (crc_height > 0) // Check the CRC { if (rdp.tiles[tile].size < 3) crc = textureCRC(addr, wid_64, crc_height, line); else //32b texture { int line_2 = line >> 1; int wid_64_2 = maxval(1, wid_64 >> 1); crc = textureCRC(addr, wid_64_2, crc_height, line_2); crc += textureCRC(addr + 0x800, wid_64_2, crc_height, line_2); } } } else { crc = 0xFFFFFFFF; uintptr_t addr = uintptr_t(rdp.tmem) + (rdp.tiles[tile].t_mem << 3); uint32_t line2 = maxval(line, 1); if (rdp.tiles[tile].size < 3) { line2 <<= 3; for (int y = 0; y < crc_height; y++) { crc = CRC32(crc, reinterpret_cast(addr), bpl); addr += line2; } } else //32b texture { line2 <<= 2; //32b texel is split in two 16b parts, so bpl/2 and line/2. //Min value for bpl is 4, because when width==1 first 2 bytes of tmem will not be used. bpl = maxval(bpl >> 1, 4); for (int y = 0; y < crc_height; y++) { crc = CRC32(crc, reinterpret_cast(addr), bpl); crc = CRC32(crc, reinterpret_cast(addr + 0x800), bpl); addr += line2; } } line = (line - wid_64) << 3; if (wid_64 < 1) wid_64 = 1; } if ((rdp.tiles[tile].size < 2) && (rdp.tlut_mode || rdp.tiles[tile].format == 2)) { if (rdp.tiles[tile].size == 0) crc += rdp.pal_8_crc[rdp.tiles[tile].palette]; else crc += rdp.pal_256_crc; } WriteTrace(TraceRDP, TraceDebug, "Done. CRC is: %08lx.", crc); uint32_t flags = (rdp.tiles[tile].clamp_s << 23) | (rdp.tiles[tile].mirror_s << 22) | (rdp.tiles[tile].mask_s << 18) | (rdp.tiles[tile].clamp_t << 17) | (rdp.tiles[tile].mirror_t << 16) | (rdp.tiles[tile].mask_t << 12); info->real_image_width = real_image_width; info->real_image_height = real_image_height; info->tile_width = tile_width; info->tile_height = tile_height; info->mask_width = mask_width; info->mask_height = mask_height; info->width = width; info->height = height; info->wid_64 = wid_64; info->line = line; info->crc = crc; info->flags = flags; // Search the texture cache for this texture WriteTrace(TraceRDP, TraceDebug, " | | |-+ Checking cache..."); CACHE_LUT *cache; if (rdp.noise == RDP::noise_texture) return; uint32_t mod, modcolor, modcolor1, modcolor2, modfactor; if (id == 0) { mod = cmb.mod_0; modcolor = cmb.modcolor_0; modcolor1 = cmb.modcolor1_0; modcolor2 = cmb.modcolor2_0; modfactor = cmb.modfactor_0; } else { mod = cmb.mod_1; modcolor = cmb.modcolor_1; modcolor1 = cmb.modcolor1_1; modcolor2 = cmb.modcolor2_1; modfactor = cmb.modfactor_1; } NODE *node = cachelut[crc >> 16]; uint32_t mod_mask = (rdp.tiles[tile].format == 2) ? 0xFFFFFFFF : 0xF0F0F0F0; while (node) { if (node->crc == crc) { cache = (CACHE_LUT*)node->data; if (/*tex_found[id][node->tmu] == -1 && rdp.tiles[tile].palette == cache->palette && rdp.tiles[tile].format == cache->format && rdp.tiles[tile].size == cache->size &&*/ rdp.tiles[tile].width == cache->width && rdp.tiles[tile].height == cache->height && flags == cache->flags) { if (!(mod + cache->mod) || (cache->mod == mod && (cache->mod_color&mod_mask) == (modcolor&mod_mask) && (cache->mod_color1&mod_mask) == (modcolor1&mod_mask) && (cache->mod_color2&mod_mask) == (modcolor2&mod_mask) && abs((int)(cache->mod_factor - modfactor)) < 8)) { WriteTrace(TraceRDP, TraceDebug, " | | | |- Texture found in cache (tmu=%d).", node->tmu); tex_found[id][node->tmu] = node->number; if (voodoo.tex_UMA) { tex_found[id][node->tmu ^ 1] = node->number; return; } } } } node = node->pNext; } WriteTrace(TraceRDP, TraceDebug, " | | | +- Done.\n | | +- GetTexInfo end"); } //**************************************************************** // ChooseBestTmu - chooses the best TMU to load to (the one with the most memory) int ChooseBestTmu(int tmu1, int tmu2) { if (!GfxInitDone) return tmu1; if (voodoo.tex_UMA) return 0; if (tmu1 >= voodoo.num_tmu) return tmu2; if (tmu2 >= voodoo.num_tmu) return tmu1; if (voodoo.tex_max_addr[tmu1] - voodoo.tmem_ptr[tmu1] > voodoo.tex_max_addr[tmu2] - voodoo.tmem_ptr[tmu2]) return tmu1; else return tmu2; } //**************************************************************** // SelectTBuffTex - select texture from texture buffer static void SelectTBuffTex(TBUFF_COLOR_IMAGE * pTBuffTex) { WriteTrace(TraceRDP, TraceDebug, "SelectTBuffTex: tex: %d, tmu: %d, tile: %d", rdp.tex, pTBuffTex->tmu, pTBuffTex->tile); grTexSource(pTBuffTex->tile, pTBuffTex->tex_addr, GR_MIPMAPLEVELMASK_BOTH, &(pTBuffTex->info)); } //**************************************************************** // TexCache - does texture loading after combiner is set int SwapTextureBuffer(); void TexCache() { WriteTrace(TraceRDP, TraceDebug, " |-+ TexCache called"); #ifdef TEXTURE_FILTER /* Hiroshi Morii */ // POSTNAPALM if (g_settings->ghq_use && g_settings->ghq_hirs_dump) { /* Force reload hi-res textures. Useful for texture artists */ if (CheckKeyPressed(G64_VK_R, 0x0001)) { if (ext_ghq_reloadhirestex()) ClearCache(); } /* Turn on texture dump */ else if (CheckKeyPressed(G64_VK_D, 0x0001)) { extern void DisplayLoadProgress(const wchar_t *format, ...); ghq_dmptex_toggle_key = !ghq_dmptex_toggle_key; if (ghq_dmptex_toggle_key) { DisplayLoadProgress(L"Texture dump - ON"); ClearCache(); } else { DisplayLoadProgress(L"Texture dump - OFF"); } pjutil::Sleep(1000); } } #endif if (rdp.tex & 1) GetTexInfo(0, rdp.cur_tile); if (rdp.tex & 2) GetTexInfo(1, rdp.cur_tile + 1); TBUFF_COLOR_IMAGE * aTBuff[2] = { 0, 0 }; if (rdp.aTBuffTex[0]) aTBuff[rdp.aTBuffTex[0]->tile] = rdp.aTBuffTex[0]; if (rdp.aTBuffTex[1]) aTBuff[rdp.aTBuffTex[1]->tile] = rdp.aTBuffTex[1]; #define TMUMODE_NORMAL 0 #define TMUMODE_PASSTHRU 1 #define TMUMODE_NONE 2 int tmu_0, tmu_1; int tmu_0_mode = 0, tmu_1_mode = 0; // Select the best TMUs to use (removed 3 tmu support, unnecessary) if (rdp.tex == 3) // T0 and T1 { tmu_0 = 0; tmu_1 = 1; } else if (rdp.tex == 2) // T1 { if (tex_found[1][0] != -1) // T1 found in tmu 0 tmu_1 = 0; else if (tex_found[1][1] != -1) // T1 found in tmu 1 tmu_1 = 1; else // T1 not found tmu_1 = ChooseBestTmu(0, 1); tmu_0 = !tmu_1; tmu_0_mode = (tmu_0 == 1) ? TMUMODE_NONE : TMUMODE_PASSTHRU; } else if (rdp.tex == 1) // T0 { if (tex_found[0][0] != -1) // T0 found in tmu 0 tmu_0 = 0; else if (tex_found[0][1] != -1) // T0 found in tmu 1 tmu_0 = 1; else // T0 not found tmu_0 = ChooseBestTmu(0, 1); tmu_1 = !tmu_0; tmu_1_mode = (tmu_1 == 1) ? TMUMODE_NONE : TMUMODE_PASSTHRU; } else // no texture { tmu_0 = 0; tmu_0_mode = TMUMODE_NONE; tmu_1 = 0; tmu_1_mode = TMUMODE_NONE; } WriteTrace(TraceRDP, TraceDebug, " | |-+ Modes set:\n | | |- tmu_0 = %d\n | | |- tmu_1 = %d", tmu_0, tmu_1); WriteTrace(TraceRDP, TraceDebug, " | | |- tmu_0_mode = %d\n | | |- tmu_1_mode = %d", tmu_0_mode, tmu_1_mode); if (tmu_0_mode == TMUMODE_PASSTHRU) { cmb.tmu0_func = cmb.tmu0_a_func = GR_COMBINE_FUNCTION_SCALE_OTHER; cmb.tmu0_fac = cmb.tmu0_a_fac = GR_COMBINE_FACTOR_ONE; if (cmb.tex_cmb_ext_use) { cmb.t0c_ext_a = GR_CMBX_OTHER_TEXTURE_RGB; cmb.t0c_ext_a_mode = GR_FUNC_MODE_X; cmb.t0c_ext_b = GR_CMBX_LOCAL_TEXTURE_RGB; cmb.t0c_ext_b_mode = GR_FUNC_MODE_ZERO; cmb.t0c_ext_c = GR_CMBX_ZERO; cmb.t0c_ext_c_invert = 1; cmb.t0c_ext_d = GR_CMBX_ZERO; cmb.t0c_ext_d_invert = 0; cmb.t0a_ext_a = GR_CMBX_OTHER_TEXTURE_ALPHA; cmb.t0a_ext_a_mode = GR_FUNC_MODE_X; cmb.t0a_ext_b = GR_CMBX_LOCAL_TEXTURE_ALPHA; cmb.t0a_ext_b_mode = GR_FUNC_MODE_ZERO; cmb.t0a_ext_c = GR_CMBX_ZERO; cmb.t0a_ext_c_invert = 1; cmb.t0a_ext_d = GR_CMBX_ZERO; cmb.t0a_ext_d_invert = 0; } } else if (tmu_0_mode == TMUMODE_NONE) { cmb.tmu0_func = cmb.tmu0_a_func = GR_COMBINE_FUNCTION_NONE; cmb.tmu0_fac = cmb.tmu0_a_fac = GR_COMBINE_FACTOR_NONE; if (cmb.tex_cmb_ext_use) { cmb.t0c_ext_a = GR_CMBX_LOCAL_TEXTURE_RGB; cmb.t0c_ext_a_mode = GR_FUNC_MODE_ZERO; cmb.t0c_ext_b = GR_CMBX_LOCAL_TEXTURE_RGB; cmb.t0c_ext_b_mode = GR_FUNC_MODE_ZERO; cmb.t0c_ext_c = GR_CMBX_ZERO; cmb.t0c_ext_c_invert = 0; cmb.t0c_ext_d = GR_CMBX_ZERO; cmb.t0c_ext_d_invert = 0; cmb.t0a_ext_a = GR_CMBX_LOCAL_TEXTURE_ALPHA; cmb.t0a_ext_a_mode = GR_FUNC_MODE_ZERO; cmb.t0a_ext_b = GR_CMBX_LOCAL_TEXTURE_ALPHA; cmb.t0a_ext_b_mode = GR_FUNC_MODE_ZERO; cmb.t0a_ext_c = GR_CMBX_ZERO; cmb.t0a_ext_c_invert = 0; cmb.t0a_ext_d = GR_CMBX_ZERO; cmb.t0a_ext_d_invert = 0; } } if (tmu_1_mode == TMUMODE_PASSTHRU) { cmb.tmu1_func = cmb.tmu1_a_func = GR_COMBINE_FUNCTION_SCALE_OTHER; cmb.tmu1_fac = cmb.tmu1_a_fac = GR_COMBINE_FACTOR_ONE; if (cmb.tex_cmb_ext_use) { cmb.t1c_ext_a = GR_CMBX_OTHER_TEXTURE_RGB; cmb.t1c_ext_a_mode = GR_FUNC_MODE_X; cmb.t1c_ext_b = GR_CMBX_LOCAL_TEXTURE_RGB; cmb.t1c_ext_b_mode = GR_FUNC_MODE_ZERO; cmb.t1c_ext_c = GR_CMBX_ZERO; cmb.t1c_ext_c_invert = 1; cmb.t1c_ext_d = GR_CMBX_ZERO; cmb.t1c_ext_d_invert = 0; cmb.t1a_ext_a = GR_CMBX_OTHER_TEXTURE_ALPHA; cmb.t1a_ext_a_mode = GR_FUNC_MODE_X; cmb.t1a_ext_b = GR_CMBX_LOCAL_TEXTURE_ALPHA; cmb.t1a_ext_b_mode = GR_FUNC_MODE_ZERO; cmb.t1a_ext_c = GR_CMBX_ZERO; cmb.t1a_ext_c_invert = 1; cmb.t1a_ext_d = GR_CMBX_ZERO; cmb.t1a_ext_d_invert = 0; } } else if (tmu_1_mode == TMUMODE_NONE) { cmb.tmu1_func = cmb.tmu1_a_func = GR_COMBINE_FUNCTION_NONE; cmb.tmu1_fac = cmb.tmu1_a_fac = GR_COMBINE_FACTOR_NONE; if (cmb.tex_cmb_ext_use) { cmb.t1c_ext_a = GR_CMBX_LOCAL_TEXTURE_RGB; cmb.t1c_ext_a_mode = GR_FUNC_MODE_ZERO; cmb.t1c_ext_b = GR_CMBX_LOCAL_TEXTURE_RGB; cmb.t1c_ext_b_mode = GR_FUNC_MODE_ZERO; cmb.t1c_ext_c = GR_CMBX_ZERO; cmb.t1c_ext_c_invert = 0; cmb.t1c_ext_d = GR_CMBX_ZERO; cmb.t1c_ext_d_invert = 0; cmb.t1a_ext_a = GR_CMBX_LOCAL_TEXTURE_ALPHA; cmb.t1a_ext_a_mode = GR_FUNC_MODE_ZERO; cmb.t1a_ext_b = GR_CMBX_LOCAL_TEXTURE_ALPHA; cmb.t1a_ext_b_mode = GR_FUNC_MODE_ZERO; cmb.t1a_ext_c = GR_CMBX_ZERO; cmb.t1a_ext_c_invert = 0; cmb.t1a_ext_d = GR_CMBX_ZERO; cmb.t1a_ext_d_invert = 0; } } // little change to make single-tmu cards look better, use first texture no matter what if (voodoo.num_tmu == 1) { if (rdp.best_tex == 0) { cmb.tmu0_func = cmb.tmu0_a_func = GR_COMBINE_FUNCTION_LOCAL; cmb.tmu0_fac = cmb.tmu0_a_fac = GR_COMBINE_FACTOR_NONE; tmu_0 = 0; tmu_1 = 1; } else { cmb.tmu1_func = cmb.tmu1_a_func = GR_COMBINE_FUNCTION_LOCAL; cmb.tmu1_fac = cmb.tmu1_a_fac = GR_COMBINE_FACTOR_NONE; tmu_1 = 0; tmu_0 = 1; } } rdp.t0 = tmu_0; rdp.t1 = tmu_1; // SET the combiner if (GfxInitDone) { if (rdp.allow_combine) { // Now actually combine if (cmb.cmb_ext_use) { WriteTrace(TraceRDP, TraceDebug, " | | | |- combiner extension"); if (!(cmb.cmb_ext_use & COMBINE_EXT_COLOR)) ColorCombinerToExtension(); if (!(cmb.cmb_ext_use & COMBINE_EXT_ALPHA)) AlphaCombinerToExtension(); cmb.grColorCombineExt(cmb.c_ext_a, cmb.c_ext_a_mode, cmb.c_ext_b, cmb.c_ext_b_mode, cmb.c_ext_c, cmb.c_ext_c_invert, cmb.c_ext_d, cmb.c_ext_d_invert, 0, 0); cmb.grAlphaCombineExt(cmb.a_ext_a, cmb.a_ext_a_mode, cmb.a_ext_b, cmb.a_ext_b_mode, cmb.a_ext_c, cmb.a_ext_c_invert, cmb.a_ext_d, cmb.a_ext_d_invert, 0, 0); } else { grColorCombine(cmb.c_fnc, cmb.c_fac, cmb.c_loc, cmb.c_oth, FXFALSE); grAlphaCombine(cmb.a_fnc, cmb.a_fac, cmb.a_loc, cmb.a_oth, FXFALSE); } grConstantColorValue(cmb.ccolor); grAlphaBlendFunction(cmb.abf1, cmb.abf2, GR_BLEND_ZERO, GR_BLEND_ZERO); if (!rdp.tex) //nothing more to do return; } if (tmu_1 < voodoo.num_tmu) { if (cmb.tex_cmb_ext_use) { WriteTrace(TraceRDP, TraceDebug, " | | | |- combiner extension tmu1"); if (!(cmb.tex_cmb_ext_use & TEX_COMBINE_EXT_COLOR)) TexColorCombinerToExtension(GR_TMU1); if (!(cmb.tex_cmb_ext_use & TEX_COMBINE_EXT_ALPHA)) TexAlphaCombinerToExtension(GR_TMU1); cmb.grTexColorCombineExt(tmu_1, cmb.t1c_ext_a, cmb.t1c_ext_a_mode, cmb.t1c_ext_b, cmb.t1c_ext_b_mode, cmb.t1c_ext_c, cmb.t1c_ext_c_invert, cmb.t1c_ext_d, cmb.t1c_ext_d_invert, 0, 0); cmb.grTexAlphaCombineExt(tmu_1, cmb.t1a_ext_a, cmb.t1a_ext_a_mode, cmb.t1a_ext_b, cmb.t1a_ext_b_mode, cmb.t1a_ext_c, cmb.t1a_ext_c_invert, cmb.t1a_ext_d, cmb.t1a_ext_d_invert, 0, 0); cmb.grConstantColorValueExt(tmu_1, cmb.tex_ccolor); } else { grTexCombine(tmu_1, cmb.tmu1_func, cmb.tmu1_fac, cmb.tmu1_a_func, cmb.tmu1_a_fac, cmb.tmu1_invert, cmb.tmu1_a_invert); if (cmb.combine_ext) cmb.grConstantColorValueExt(tmu_1, 0); } grTexDetailControl(tmu_1, cmb.dc1_lodbias, cmb.dc1_detailscale, cmb.dc1_detailmax); grTexLodBiasValue(tmu_1, cmb.lodbias1); } if (tmu_0 < voodoo.num_tmu) { if (cmb.tex_cmb_ext_use) { WriteTrace(TraceRDP, TraceDebug, " | | | |- combiner extension tmu0"); if (!(cmb.tex_cmb_ext_use & TEX_COMBINE_EXT_COLOR)) TexColorCombinerToExtension(GR_TMU0); if (!(cmb.tex_cmb_ext_use & TEX_COMBINE_EXT_ALPHA)) TexAlphaCombinerToExtension(GR_TMU0); cmb.grTexColorCombineExt(tmu_0, cmb.t0c_ext_a, cmb.t0c_ext_a_mode, cmb.t0c_ext_b, cmb.t0c_ext_b_mode, cmb.t0c_ext_c, cmb.t0c_ext_c_invert, cmb.t0c_ext_d, cmb.t0c_ext_d_invert, 0, 0); cmb.grTexAlphaCombineExt(tmu_0, cmb.t0a_ext_a, cmb.t0a_ext_a_mode, cmb.t0a_ext_b, cmb.t0a_ext_b_mode, cmb.t0a_ext_c, cmb.t0a_ext_c_invert, cmb.t0a_ext_d, cmb.t0a_ext_d_invert, 0, 0); cmb.grConstantColorValueExt(tmu_0, cmb.tex_ccolor); } else { grTexCombine(tmu_0, cmb.tmu0_func, cmb.tmu0_fac, cmb.tmu0_a_func, cmb.tmu0_a_fac, cmb.tmu0_invert, cmb.tmu0_a_invert); if (cmb.combine_ext) cmb.grConstantColorValueExt(tmu_0, 0); } grTexDetailControl(tmu_0, cmb.dc0_lodbias, cmb.dc0_detailscale, cmb.dc0_detailmax); grTexLodBiasValue(tmu_0, cmb.lodbias0); } } if ((rdp.tex & 1) && tmu_0 < voodoo.num_tmu) { if (aTBuff[0] && aTBuff[0]->cache) { WriteTrace(TraceRDP, TraceDebug, " | |- Hires tex T0 found in cache."); if (GfxInitDone) { rdp.cur_cache[0] = aTBuff[0]->cache; rdp.cur_cache[0]->last_used = frame_count; rdp.cur_cache[0]->uses = rdp.debug_n; } } else if (tex_found[0][tmu_0] != -1) { WriteTrace(TraceRDP, TraceDebug, " | |- T0 found in cache."); if (GfxInitDone) { CACHE_LUT *cache = voodoo.tex_UMA ? &rdp.cache[0][tex_found[0][0]] : &rdp.cache[tmu_0][tex_found[0][tmu_0]]; rdp.cur_cache_n[0] = tex_found[0][tmu_0]; rdp.cur_cache[0] = cache; rdp.cur_cache[0]->last_used = frame_count; rdp.cur_cache[0]->uses = rdp.debug_n; grTexSource(tmu_0, (voodoo.tex_min_addr[tmu_0] + cache->tmem_addr), GR_MIPMAPLEVELMASK_BOTH, &cache->t_info); } } else LoadTex(0, tmu_0); } if ((rdp.tex & 2) && tmu_1 < voodoo.num_tmu) { if (aTBuff[1] && aTBuff[1]->cache) { WriteTrace(TraceRDP, TraceDebug, " | |- Hires tex T1 found in cache."); if (GfxInitDone) { rdp.cur_cache[1] = aTBuff[1]->cache; rdp.cur_cache[1]->last_used = frame_count; rdp.cur_cache[1]->uses = rdp.debug_n; } } else if (tex_found[1][tmu_1] != -1) { WriteTrace(TraceRDP, TraceDebug, " | |- T1 found in cache."); if (GfxInitDone) { CACHE_LUT *cache = voodoo.tex_UMA ? &rdp.cache[0][tex_found[1][0]] : &rdp.cache[tmu_1][tex_found[1][tmu_1]]; rdp.cur_cache_n[1] = tex_found[1][tmu_1]; rdp.cur_cache[1] = cache; rdp.cur_cache[1]->last_used = frame_count; rdp.cur_cache[1]->uses = rdp.debug_n; grTexSource(tmu_1, (voodoo.tex_min_addr[tmu_1] + cache->tmem_addr), GR_MIPMAPLEVELMASK_BOTH, &cache->t_info); } } else LoadTex(1, tmu_1); } if (GfxInitDone) { int tmu_v[2]; tmu_v[0] = tmu_0; tmu_v[1] = tmu_1; for (int i = 0; i < 2; i++) { const int tmu = tmu_v[i]; if (tmu >= voodoo.num_tmu) continue; int tile = rdp.cur_tile + i; if (g_settings->filtering == 0) { int filter = (rdp.filter_mode != 2) ? GR_TEXTUREFILTER_POINT_SAMPLED : GR_TEXTUREFILTER_BILINEAR; grTexFilterMode(tmu, filter, filter); } else { int filter = (g_settings->filtering == 1) ? GR_TEXTUREFILTER_BILINEAR : GR_TEXTUREFILTER_POINT_SAMPLED; grTexFilterMode(tmu, filter, filter); } if (rdp.cur_cache[i]) { uint32_t mode_s, mode_t; int clamp_s, clamp_t; if (rdp.force_wrap && !rdp.texrecting) { clamp_s = rdp.tiles[tile].clamp_s && rdp.tiles[tile].lr_s - rdp.tiles[tile].ul_s < 256; clamp_t = rdp.tiles[tile].clamp_t && rdp.tiles[tile].lr_t - rdp.tiles[tile].ul_t < 256; } else { clamp_s = (rdp.tiles[tile].clamp_s || rdp.tiles[tile].mask_s == 0) && rdp.tiles[tile].lr_s - rdp.tiles[tile].ul_s < 256; clamp_t = (rdp.tiles[tile].clamp_t || rdp.tiles[tile].mask_t == 0) && rdp.tiles[tile].lr_t - rdp.tiles[tile].ul_t < 256; } if (rdp.cur_cache[i]->f_mirror_s) mode_s = GR_TEXTURECLAMP_MIRROR_EXT; else if (rdp.cur_cache[i]->f_wrap_s) mode_s = GR_TEXTURECLAMP_WRAP; else if (clamp_s) mode_s = GR_TEXTURECLAMP_CLAMP; else { if (rdp.tiles[tile].mirror_s && voodoo.sup_mirroring) mode_s = GR_TEXTURECLAMP_MIRROR_EXT; else mode_s = GR_TEXTURECLAMP_WRAP; } if (rdp.cur_cache[i]->f_mirror_t) mode_t = GR_TEXTURECLAMP_MIRROR_EXT; else if (rdp.cur_cache[i]->f_wrap_t) mode_t = GR_TEXTURECLAMP_WRAP; else if (clamp_t) mode_t = GR_TEXTURECLAMP_CLAMP; else { if (rdp.tiles[tile].mirror_t && voodoo.sup_mirroring) mode_t = GR_TEXTURECLAMP_MIRROR_EXT; else mode_t = GR_TEXTURECLAMP_WRAP; } grTexClampMode(tmu, mode_s, mode_t); } if (aTBuff[i] && (rdp.tex&(i + 1))) SelectTBuffTex(aTBuff[i]); } } WriteTrace(TraceRDP, TraceDebug, " | +- TexCache End"); } #ifdef TEXTURE_FILTER /** cite from RiceVideo */ inline uint32_t CalculateDXT(uint32_t txl2words) { if (txl2words == 0) return 1; else return (2048 + txl2words - 1) / txl2words; } uint32_t sizeBytes[4] = { 0, 1, 2, 4 }; inline uint32_t Txl2Words(uint32_t width, uint32_t size) { return size == 0 ? maxval(1, width / 16) : maxval(1, width*sizeBytes[size] / 8); } inline uint32_t ReverseDXT(uint32_t val, uint32_t /*lrs*/, uint32_t width, uint32_t size) { if (val == 0x800) return 1; int low = 2047 / val; if (CalculateDXT(low) > val) low++; int high = 2047 / (val - 1); if (low == high) return low; for (int i = low; i <= high; i++) { if (Txl2Words(width, size) == (uint32_t)i) return i; } return (low + high) / 2; } /** end RiceVideo cite */ #endif //**************************************************************** // LoadTex - does the actual texture loading after everything is prepared void LoadTex(int id, int tmu) { WriteTrace(TraceRDP, TraceDebug, " | |-+ LoadTex (id: %d, tmu: %d)", id, tmu); int td = rdp.cur_tile + id; int lod, aspect; CACHE_LUT *cache; if (texinfo[id].width < 0 || texinfo[id].height < 0) return; // Clear the cache if it's full if (rdp.n_cached[tmu] >= MAX_CACHE) { WriteTrace(TraceRDP, TraceDebug, "Cache count reached, clearing..."); ClearCache(); if (id == 1 && rdp.tex == 3) LoadTex(0, rdp.t0); } // Get this cache object cache = voodoo.tex_UMA ? &rdp.cache[0][rdp.n_cached[0]] : &rdp.cache[tmu][rdp.n_cached[tmu]]; memset(cache, 0, sizeof(*cache)); rdp.cur_cache[id] = cache; rdp.cur_cache_n[id] = rdp.n_cached[tmu]; //!Hackalert //GoldenEye water texture. It has CI format in fact, but the game set it to RGBA if ((g_settings->hacks&hack_GoldenEye) && rdp.tiles[td].format == 0 && rdp.tlut_mode == 2 && rdp.tiles[td].size == 2) { rdp.tiles[td].format = 2; rdp.tiles[td].size = 1; } // Set the data cache->line = rdp.tiles[td].line; cache->addr = rdp.addr[rdp.tiles[td].t_mem]; cache->crc = texinfo[id].crc; cache->palette = rdp.tiles[td].palette; cache->width = rdp.tiles[td].width; cache->height = rdp.tiles[td].height; cache->format = rdp.tiles[td].format; cache->size = rdp.tiles[td].size; cache->tmem_addr = voodoo.tmem_ptr[tmu]; cache->set_by = rdp.timg.set_by; cache->texrecting = rdp.texrecting; cache->last_used = frame_count; cache->uses = rdp.debug_n; cache->flags = texinfo[id].flags; cache->f_mirror_s = FALSE; cache->f_mirror_t = FALSE; cache->f_wrap_s = FALSE; cache->f_wrap_t = FALSE; #ifdef TEXTURE_FILTER cache->is_hires_tex = FALSE; cache->ricecrc = texinfo[id].ricecrc; #endif // Add this cache to the list AddToList(&cachelut[cache->crc >> 16], cache->crc, uintptr_t(cache), tmu, rdp.n_cached[tmu]); // temporary cache->t_info.format = GR_TEXFMT_ARGB_1555; // Calculate lod and aspect uint32_t size_x = rdp.tiles[td].width; uint32_t size_y = rdp.tiles[td].height; // make size_x and size_y both powers of two if (!voodoo.sup_large_tex) { if (size_x > 256) size_x = 256; if (size_y > 256) size_y = 256; } int shift; for (shift = 0; (1 << shift) < (int)size_x; shift++); size_x = 1 << shift; for (shift = 0; (1 << shift) < (int)size_y; shift++); size_y = 1 << shift; // Voodoo 1 support is all here, it will automatically mirror to the full extent. if (!voodoo.sup_mirroring) { if (rdp.tiles[td].mirror_s && !rdp.tiles[td].clamp_s && (voodoo.sup_large_tex || size_x <= 128)) size_x <<= 1; if (rdp.tiles[td].mirror_t && !rdp.tiles[td].clamp_t && (voodoo.sup_large_tex || size_y <= 128)) size_y <<= 1; } // Calculate the maximum size int size_max = maxval(size_x, size_y); uint32_t real_x = size_max, real_y = size_max; switch (size_max) { case 1: lod = GR_LOD_LOG2_1; cache->scale = 256.0f; break; case 2: lod = GR_LOD_LOG2_2; cache->scale = 128.0f; break; case 4: lod = GR_LOD_LOG2_4; cache->scale = 64.0f; break; case 8: lod = GR_LOD_LOG2_8; cache->scale = 32.0f; break; case 16: lod = GR_LOD_LOG2_16; cache->scale = 16.0f; break; case 32: lod = GR_LOD_LOG2_32; cache->scale = 8.0f; break; case 64: lod = GR_LOD_LOG2_64; cache->scale = 4.0f; break; case 128: lod = GR_LOD_LOG2_128; cache->scale = 2.0f; break; case 256: lod = GR_LOD_LOG2_256; cache->scale = 1.0f; break; case 512: lod = GR_LOD_LOG2_512; cache->scale = 0.5f; break; default: lod = GR_LOD_LOG2_1024; cache->scale = 0.25f; break; } // Calculate the aspect ratio if (size_x >= size_y) { int ratio = size_x / size_y; switch (ratio) { case 1: aspect = GR_ASPECT_LOG2_1x1; cache->scale_x = 1.0f; cache->scale_y = 1.0f; break; case 2: aspect = GR_ASPECT_LOG2_2x1; cache->scale_x = 1.0f; cache->scale_y = 0.5f; real_y >>= 1; break; case 4: aspect = GR_ASPECT_LOG2_4x1; cache->scale_x = 1.0f; cache->scale_y = 0.25f; real_y >>= 2; break; default: aspect = GR_ASPECT_LOG2_8x1; cache->scale_x = 1.0f; cache->scale_y = 0.125f; real_y >>= 3; break; } } else { int ratio = size_y / size_x; switch (ratio) { case 2: aspect = GR_ASPECT_LOG2_1x2; cache->scale_x = 0.5f; cache->scale_y = 1.0f; real_x >>= 1; break; case 4: aspect = GR_ASPECT_LOG2_1x4; cache->scale_x = 0.25f; cache->scale_y = 1.0f; real_x >>= 2; break; default: aspect = GR_ASPECT_LOG2_1x8; cache->scale_x = 0.125f; cache->scale_y = 1.0f; real_x >>= 3; break; } } if (real_x != cache->width || real_y != cache->height) { cache->scale_x *= (float)cache->width / (float)real_x; cache->scale_y *= (float)cache->height / (float)real_y; } int splits = texinfo[id].splits; cache->splits = texinfo[id].splits; cache->splitheight = real_y / cache->splits; if (cache->splitheight < texinfo[id].splitheight) cache->splitheight = texinfo[id].splitheight; // ** Calculate alignment values int wid = cache->width; int hei = cache->height; if (splits > 1) { wid = texinfo[id].real_image_width; hei = texinfo[id].real_image_height; } cache->c_off = cache->scale * 0.5f; if (wid != 1) cache->c_scl_x = cache->scale; else cache->c_scl_x = 0.0f; if (hei != 1) cache->c_scl_y = cache->scale; else cache->c_scl_y = 0.0f; // ** uint32_t mod, modcolor, modcolor1, modcolor2, modfactor; if (id == 0) { mod = cmb.mod_0; modcolor = cmb.modcolor_0; modcolor1 = cmb.modcolor1_0; modcolor2 = cmb.modcolor2_0; modfactor = cmb.modfactor_0; } else { mod = cmb.mod_1; modcolor = cmb.modcolor_1; modcolor1 = cmb.modcolor1_1; modcolor2 = cmb.modcolor2_1; modfactor = cmb.modfactor_1; } uint16_t tmp_pal[256]; int modifyPalette = (mod && (cache->format == 2) && (rdp.tlut_mode == 2)); if (modifyPalette) { memcpy(tmp_pal, rdp.pal_8, 512); ModifyPalette(mod, modcolor, modcolor1, modfactor); } cache->mod = mod; cache->mod_color = modcolor; cache->mod_color1 = modcolor1; cache->mod_factor = modfactor; for (int t = 0; t < 2; t++) { if (rdp.aTBuffTex[t] && rdp.aTBuffTex[t]->tile == id) //texture buffer will be used instead of frame buffer texture { rdp.aTBuffTex[t]->cache = cache; WriteTrace(TraceRDP, TraceDebug, "tbuff_tex selected: %d, tile=%d", t, id); return; } } uint32_t result = 0; // keep =0 so it doesn't mess up on the first split texture = tex1; // Hiroshi Morii // NOTE: Loading Hi-res texture packs and filtering should be done // before the texture is modified with color palettes, etc. // // Since the internal texture identification needs Glide64CRC, (RiceCRC // doesn't always return unique values) it seems reasonable that the // extra CRC calculation for hires textures should be executed only // when we get passed the texture ram cache and texture buffers for // minimal calculation overhead. // #ifdef TEXTURE_FILTER // Hiroshi Morii GHQTexInfo ghqTexInfo; memset(&ghqTexInfo, 0, sizeof(GHQTexInfo)); uint32_t g64_crc = cache->crc; if (g_settings->ghq_use) { int bpl; uint8_t* addr = (uint8_t*)(gfx.RDRAM + rdp.addr[rdp.tiles[td].t_mem]); int tile_width = texinfo[id].width; int tile_height = texinfo[id].height; LOAD_TILE_INFO &info = rdp.load_info[rdp.tiles[td].t_mem]; if (rdp.timg.set_by == 1) { bpl = info.tex_width << info.tex_size >> 1; addr += (info.tile_ul_t * bpl) + (((info.tile_ul_s << info.tex_size) + 1) >> 1); tile_width = minval(info.tile_width, info.tex_width); if (info.tex_size > rdp.tiles[td].size) tile_width <<= info.tex_size - rdp.tiles[td].size; if (rdp.tiles[td].lr_t > rdp.bg_image_height) tile_height = rdp.bg_image_height - rdp.tiles[td].ul_t; else tile_height = info.tile_height; } else { if (rdp.tiles[td].size == 3) bpl = rdp.tiles[td].line << 4; else if (info.dxt == 0) bpl = rdp.tiles[td].line << 3; else { uint32_t dxt = info.dxt; if (dxt > 1) dxt = ReverseDXT(dxt, info.tile_width, texinfo[id].width, rdp.tiles[td].size); bpl = dxt << 3; } } // uint8_t* addr = (uint8_t*)(gfx.RDRAM+rdp.addr[rdp.tiles[td].t_mem] + (rdp.tiles[td].ul_t * bpl) + (((rdp.tiles[td].ul_s<>1)); uint8_t * paladdr = 0; uint16_t * palette = 0; if ((rdp.tiles[td].size < 2) && (rdp.tlut_mode || rdp.tiles[td].format == 2)) { if (rdp.tiles[td].size == 1) paladdr = (uint8_t*)(rdp.pal_8_rice); else if (g_settings->ghq_hirs_altcrc) paladdr = (uint8_t*)(rdp.pal_8_rice + (rdp.tiles[td].palette << 5)); else paladdr = (uint8_t*)(rdp.pal_8_rice + (rdp.tiles[td].palette << 4)); palette = (rdp.pal_8 + (rdp.tiles[td].palette << 4)); } // XXX: Special combiner modes are ignored for hires textures // for now. Come back to this later!! The following is needed // for (2xSai, hq4x, etc) enhanced/filtered textures. g64_crc = CRC32(g64_crc, &cache->mod, 4); g64_crc = CRC32(g64_crc, &cache->mod_color, 4); g64_crc = CRC32(g64_crc, &cache->mod_color1, 4); //g64_crc = CRC32( g64_crc, &cache->mod_color2, 4 ); // not used? g64_crc = CRC32(g64_crc, &cache->mod_factor, 4); cache->ricecrc = ext_ghq_checksum(addr, tile_width, tile_height, (unsigned short)(rdp.tiles[td].format << 8 | rdp.tiles[td].size), bpl, paladdr); WriteTrace(TraceRDP, TraceDebug, "CI RICE CRC. format: %d, size: %d, CRC: %08lx, PalCRC: %08lx", rdp.tiles[td].format, rdp.tiles[td].size, (uint32_t)(cache->ricecrc & 0xFFFFFFFF), (uint32_t)(cache->ricecrc >> 32)); if (ext_ghq_hirestex((uint64)g64_crc, cache->ricecrc, palette, &ghqTexInfo)) { cache->is_hires_tex = ghqTexInfo.is_hires_tex; if (!ghqTexInfo.is_hires_tex && aspect != ghqTexInfo.aspectRatioLog2) ghqTexInfo.data = 0; //if aspects of current texture and found filtered texture are different, texture must be filtered again. } } // ** handle texture splitting ** if (ghqTexInfo.data) ;//do nothing else #endif if (splits > 1) { cache->scale_y = 0.125f; int i; for (i = 0; i < splits; i++) { int start_dst = i * cache->splitheight * 256; // start lower start_dst <<= HIWORD(result); // 1st time, result is set to 0, but start_dst is 0 anyway so it doesn't matter int start_src = i * 256; // start 256 more to the right start_src = start_src << (rdp.tiles[td].size) >> 1; if (rdp.tiles[td].size == 3) start_src >>= 1; result = load_table[rdp.tiles[td].size][rdp.tiles[td].format] (uintptr_t(texture) + start_dst, uintptr_t(rdp.tmem) + (rdp.tiles[td].t_mem << 3) + start_src, texinfo[id].wid_64, texinfo[id].height, texinfo[id].line, real_x, td); uint32_t size = HIWORD(result); // clamp so that it looks somewhat ok when wrapping if (size == 1) Clamp16bT((texture)+start_dst, texinfo[id].height, real_x, cache->splitheight); else if (size != 2) Clamp8bT((texture)+start_dst, texinfo[id].height, real_x, cache->splitheight); else Clamp32bT((texture)+start_dst, texinfo[id].height, real_x, cache->splitheight); } } // ** end texture splitting ** else { result = load_table[rdp.tiles[td].size][rdp.tiles[td].format] (uintptr_t(texture), uintptr_t(rdp.tmem) + (rdp.tiles[td].t_mem << 3), texinfo[id].wid_64, texinfo[id].height, texinfo[id].line, real_x, td); uint32_t size = HIWORD(result); int min_x, min_y; if (rdp.tiles[td].mask_s != 0) min_x = minval((int)real_x, 1 << rdp.tiles[td].mask_s); else min_x = real_x; if (rdp.tiles[td].mask_t != 0) min_y = minval((int)real_y, 1 << rdp.tiles[td].mask_t); else min_y = real_y; // Load using mirroring/clamping if (min_x > texinfo[id].width) { if (size == 1) Clamp16bS((texture), texinfo[id].width, min_x, real_x, texinfo[id].height); else if (size != 2) Clamp8bS((texture), texinfo[id].width, min_x, real_x, texinfo[id].height); else Clamp32bS((texture), texinfo[id].width, min_x, real_x, texinfo[id].height); } if (texinfo[id].width < (int)real_x) { if (rdp.tiles[td].mirror_s) { if (size == 1) Mirror16bS((texture), rdp.tiles[td].mask_s, real_x, real_x, texinfo[id].height); else if (size != 2) Mirror8bS((texture), rdp.tiles[td].mask_s, real_x, real_x, texinfo[id].height); else Mirror32bS((texture), rdp.tiles[td].mask_s, real_x, real_x, texinfo[id].height); } else { if (size == 1) Wrap16bS((texture), rdp.tiles[td].mask_s, real_x, real_x, texinfo[id].height); else if (size != 2) Wrap8bS((texture), rdp.tiles[td].mask_s, real_x, real_x, texinfo[id].height); else Wrap32bS((texture), rdp.tiles[td].mask_s, real_x, real_x, texinfo[id].height); } } if (min_y > texinfo[id].height) { if (size == 1) Clamp16bT((texture), texinfo[id].height, real_x, min_y); else if (size != 2) Clamp8bT((texture), texinfo[id].height, real_x, min_y); else Clamp32bT((texture), texinfo[id].height, real_x, min_y); } if (texinfo[id].height < (int)real_y) { if (rdp.tiles[td].mirror_t) { if (size == 1) Mirror16bT((texture), rdp.tiles[td].mask_t, real_y, real_x); else if (size != 2) Mirror8bT((texture), rdp.tiles[td].mask_t, real_y, real_x); else Mirror32bT((texture), rdp.tiles[td].mask_t, real_y, real_x); } else { if (size == 1) Wrap16bT((texture), rdp.tiles[td].mask_t, real_y, real_x); else if (size != 2) Wrap8bT((texture), rdp.tiles[td].mask_t, real_y, real_x); else Wrap32bT((texture), rdp.tiles[td].mask_t, real_y, real_x); } } } if (modifyPalette) { memcpy(rdp.pal_8, tmp_pal, 512); } #ifdef TEXTURE_FILTER if (mod && !modifyPalette && !ghqTexInfo.data) #else if (mod && !modifyPalette) #endif { // Convert the texture to ARGB 4444 if (LOWORD(result) == GR_TEXFMT_ARGB_1555) { TexConv_ARGB1555_ARGB4444((texture), (tex2), real_x, real_y); texture = tex2; } else if (LOWORD(result) == GR_TEXFMT_ALPHA_INTENSITY_88) { TexConv_AI88_ARGB4444((texture), (tex2), real_x, real_y); texture = tex2; } else if (LOWORD(result) == GR_TEXFMT_ALPHA_INTENSITY_44) { TexConv_AI44_ARGB4444((texture), (tex2), real_x, real_y); texture = tex2; } else if (LOWORD(result) == GR_TEXFMT_ALPHA_8) { TexConv_A8_ARGB4444((texture), (tex2), real_x, real_y); texture = tex2; } /*else if (LOWORD(result) == GR_TEXFMT_ARGB_4444) { memcpy (tex2, texture, (real_x*real_y) << 1); texture = tex2; }*/ // we can skip memcpy since "texture" won't be swapped between "tex1" and "tex2" after this. // Hiroshi Morii result = (1 << 16) | GR_TEXFMT_ARGB_4444; // Now convert the color to the same modcolor = ((modcolor & 0xF0000000) >> 16) | ((modcolor & 0x00F00000) >> 12) | ((modcolor & 0x0000F000) >> 8) | ((modcolor & 0x000000F0) >> 4); modcolor1 = ((modcolor1 & 0xF0000000) >> 16) | ((modcolor1 & 0x00F00000) >> 12) | ((modcolor1 & 0x0000F000) >> 8) | ((modcolor1 & 0x000000F0) >> 4); modcolor2 = ((modcolor2 & 0xF0000000) >> 16) | ((modcolor2 & 0x00F00000) >> 12) | ((modcolor2 & 0x0000F000) >> 8) | ((modcolor2 & 0x000000F0) >> 4); int size = (real_x * real_y) << 1; switch (mod) { case TMOD_TEX_INTER_COLOR_USING_FACTOR: mod_tex_inter_color_using_factor((uint16_t*)texture, size, modcolor, modfactor); break; case TMOD_TEX_INTER_COL_USING_COL1: mod_tex_inter_col_using_col1((uint16_t*)texture, size, modcolor, modcolor1); break; case TMOD_FULL_COLOR_SUB_TEX: mod_full_color_sub_tex((uint16_t*)texture, size, modcolor); break; case TMOD_COL_INTER_COL1_USING_TEX: mod_col_inter_col1_using_tex((uint16_t*)texture, size, modcolor, modcolor1); break; case TMOD_COL_INTER_COL1_USING_TEXA: mod_col_inter_col1_using_texa((uint16_t*)texture, size, modcolor, modcolor1); break; case TMOD_COL_INTER_COL1_USING_TEXA__MUL_TEX: mod_col_inter_col1_using_texa__mul_tex((uint16_t*)texture, size, modcolor, modcolor1); break; case TMOD_COL_INTER_TEX_USING_TEXA: mod_col_inter_tex_using_texa((uint16_t*)texture, size, modcolor); break; case TMOD_COL2_INTER__COL_INTER_COL1_USING_TEX__USING_TEXA: mod_col2_inter__col_inter_col1_using_tex__using_texa((uint16_t*)texture, size, modcolor, modcolor1, modcolor2); break; case TMOD_TEX_SCALE_FAC_ADD_FAC: mod_tex_scale_fac_add_fac((uint16_t*)texture, size, modfactor); break; case TMOD_TEX_SUB_COL_MUL_FAC_ADD_TEX: mod_tex_sub_col_mul_fac_add_tex((uint16_t*)texture, size, modcolor, modfactor); break; case TMOD_TEX_SCALE_COL_ADD_COL: mod_tex_scale_col_add_col((uint16_t*)texture, size, modcolor, modcolor1); break; case TMOD_TEX_ADD_COL: mod_tex_add_col((uint16_t*)texture, size, modcolor); break; case TMOD_TEX_SUB_COL: mod_tex_sub_col((uint16_t*)texture, size, modcolor); break; case TMOD_TEX_SUB_COL_MUL_FAC: mod_tex_sub_col_mul_fac((uint16_t*)texture, size, modcolor, modfactor); break; case TMOD_COL_INTER_TEX_USING_COL1: mod_col_inter_tex_using_col1((uint16_t*)texture, size, modcolor, modcolor1); break; case TMOD_COL_MUL_TEXA_ADD_TEX: mod_col_mul_texa_add_tex((uint16_t*)texture, size, modcolor); break; case TMOD_COL_INTER_TEX_USING_TEX: mod_col_inter_tex_using_tex((uint16_t*)texture, size, modcolor); break; case TMOD_TEX_INTER_NOISE_USING_COL: mod_tex_inter_noise_using_col((uint16_t*)texture, size, modcolor); break; case TMOD_TEX_INTER_COL_USING_TEXA: mod_tex_inter_col_using_texa((uint16_t*)texture, size, modcolor); break; case TMOD_TEX_MUL_COL: mod_tex_mul_col((uint16_t*)texture, size, modcolor); break; case TMOD_TEX_SCALE_FAC_ADD_COL: mod_tex_scale_fac_add_col((uint16_t*)texture, size, modcolor, modfactor); break; default: ; } } cache->t_info.format = LOWORD(result); cache->realwidth = real_x; cache->realheight = real_y; cache->lod = lod; cache->aspect = aspect; if (GfxInitDone) { #ifdef TEXTURE_FILTER // Hiroshi Morii if (g_settings->ghq_use) { if (!ghqTexInfo.data && ghq_dmptex_toggle_key) { unsigned char *tmpbuf = (unsigned char*)texture; int tmpwidth = real_x; if (texinfo[id].splits > 1) { int dstpixoffset, srcpixoffset; int shift; switch (LOWORD(result) & 0x7fff) { // XXX is there a better way of determining the pixel color depth? case GR_TEXFMT_ARGB_8888: shift = 3; break; case GR_TEXFMT_ALPHA_INTENSITY_44: case GR_TEXFMT_ALPHA_8: shift = 0; break; default: shift = 1; } tmpwidth = texinfo[id].real_image_width; tmpbuf = (unsigned char*)malloc((256 * 256) << 3); // XXX performance overhead for (int i = 0; i < cache->splitheight; i++) { dstpixoffset = texinfo[id].real_image_width * i; srcpixoffset = 256 * i; for (int k = 0; k < texinfo[id].splits; k++) { memcpy(tmpbuf + (dstpixoffset << shift), texture + (srcpixoffset << shift), (256 << shift)); dstpixoffset += 256; srcpixoffset += (256 * cache->splitheight); } } } ext_ghq_dmptx(tmpbuf, (int)texinfo[id].real_image_width, (int)texinfo[id].real_image_height, (int)tmpwidth, (unsigned short)LOWORD(result), (unsigned short)((cache->format << 8) | (cache->size)), cache->ricecrc); if (tmpbuf != texture && tmpbuf) { free(tmpbuf); } } if (!ghqTexInfo.data) if (!g_settings->ghq_enht_nobg || !rdp.texrecting || (texinfo[id].splits == 1 && texinfo[id].width <= 256)) ext_ghq_txfilter((unsigned char*)texture, (int)real_x, (int)real_y, LOWORD(result), (uint64)g64_crc, &ghqTexInfo); if (ghqTexInfo.data) { if (ghqTexInfo.aspectRatioLog2 < GR_ASPECT_LOG2_1x8 || ghqTexInfo.aspectRatioLog2 > GR_ASPECT_LOG2_8x1 || ghqTexInfo.largeLodLog2 > GR_LOD_LOG2_2048 || ghqTexInfo.largeLodLog2 < GR_LOD_LOG2_1) { /* invalid dimensions */ } else { texture = (uint8_t *)ghqTexInfo.data; lod = ghqTexInfo.largeLodLog2; int splits = cache->splits; if (ghqTexInfo.is_hires_tex) { if (ghqTexInfo.tiles/*ghqTexInfo.untiled_width > max_tex_size*/) { cache->scale = 1.0f; cache->c_off = 0.5f; cache->splits = ghqTexInfo.tiles;//((hirestex.width-1)>>8)+1; cache->splitheight = ghqTexInfo.untiled_height; cache->scale_x = 1.0f; cache->scale_y = float(ghqTexInfo.untiled_height*ghqTexInfo.tiles) / float(ghqTexInfo.width);//*sy; if (splits == 1) { int shift; for (shift = 9; (1 << shift) < ghqTexInfo.untiled_width; shift++); float mult = float(1 << shift >> 8); cache->c_scl_x *= mult; cache->c_scl_y *= mult; } else { int tile_width = rdp.tiles[td].width; if (rdp.timg.set_by == 1) tile_width = rdp.load_info[rdp.tiles[td].t_mem].tex_width; float mult = float(ghqTexInfo.untiled_width / tile_width); cache->c_scl_x *= mult; cache->c_scl_y *= mult; } } else { cache->scale = 256.0f / float(1 << lod); cache->c_off = cache->scale * 0.5f; cache->splits = 1; if (aspect != ghqTexInfo.aspectRatioLog2) { float mscale = float(1 << abs(aspect - ghqTexInfo.aspectRatioLog2)); if (abs(aspect) > abs(ghqTexInfo.aspectRatioLog2)) { cache->c_scl_y *= mscale; cache->c_scl_x *= mscale; } /* else { if (rdp.tiles[td].mirror_s && sup_mirroring) cache->f_mirror_s = TRUE; if (rdp.tiles[td].mirror_t && sup_mirroring) cache->f_mirror_t = TRUE; //cache->c_scl_y /= mscale; //cache->c_scl_x /= mscale; } */ if (ghqTexInfo.aspectRatioLog2 >= 0) { cache->scale_x = 1.0f; cache->scale_y = 1.0f / float(1 << ghqTexInfo.aspectRatioLog2); } else { cache->scale_y = 1.0f; cache->scale_x = 1.0f / float(1 << (-ghqTexInfo.aspectRatioLog2)); } } else if (splits > 1) { cache->c_scl_x /= splits; cache->c_scl_y /= splits; } } if (voodoo.sup_mirroring) { if (rdp.tiles[td].mirror_s && texinfo[id].tile_width == 2 * texinfo[id].width) cache->f_mirror_s = TRUE; else if (texinfo[id].tile_width >= 2 * texinfo[id].width) cache->f_wrap_s = TRUE; if (rdp.tiles[td].mirror_t && texinfo[id].tile_height == 2 * texinfo[id].height) cache->f_mirror_t = TRUE; else if (texinfo[id].tile_height >= 2 * texinfo[id].height) cache->f_wrap_t = TRUE; if (cache->f_mirror_s && cache->f_mirror_t) { cache->c_scl_x *= 2.0f; cache->c_scl_y *= 2.0f; } } aspect = ghqTexInfo.aspectRatioLog2; cache->lod = lod; cache->aspect = aspect; } else { //cache->scale = 256.0f / float(1<c_off = 128.0f / float(1 << lod); } real_x = ghqTexInfo.width; real_y = ghqTexInfo.height; result = (1 << 16) | ghqTexInfo.format; cache->t_info.format = ghqTexInfo.format; cache->realwidth = real_x; cache->realheight = real_y; } } } #endif // Load the texture into texture memory GrTexInfo *t_info = &cache->t_info; t_info->data = texture; t_info->smallLodLog2 = lod; t_info->largeLodLog2 = lod; t_info->aspectRatioLog2 = aspect; uint32_t texture_size = grTexTextureMemRequired(GR_MIPMAPLEVELMASK_BOTH, t_info); // Check for 2mb boundary // Hiroshi Morii required only for V1,Rush, and V2 if (voodoo.has_2mb_tex_boundary && (voodoo.tmem_ptr[tmu] < TEXMEM_2MB_EDGE) && (voodoo.tmem_ptr[tmu] + texture_size > TEXMEM_2MB_EDGE)) { voodoo.tmem_ptr[tmu] = TEXMEM_2MB_EDGE; cache->tmem_addr = voodoo.tmem_ptr[tmu]; } // Check for end of memory (too many textures to fit, clear cache) if (voodoo.tmem_ptr[tmu] + texture_size >= voodoo.tex_max_addr[tmu]) { WriteTrace(TraceRDP, TraceDebug, "Cache size reached, clearing..."); ClearCache(); if (id == 1 && rdp.tex == 3) LoadTex(0, rdp.t0); LoadTex(id, tmu); return; // DON'T CONTINUE (already done) } uint32_t tex_addr = GetTexAddr(tmu, texture_size); grTexDownloadMipMap(tmu, tex_addr, GR_MIPMAPLEVELMASK_BOTH, t_info); grTexSource(tmu, tex_addr, GR_MIPMAPLEVELMASK_BOTH, t_info); } WriteTrace(TraceRDP, TraceDebug, " | | +- LoadTex end"); }