From 59980ba1c71e32a886fc04c849b6442452f276d1 Mon Sep 17 00:00:00 2001 From: Matt Borgerson Date: Sat, 14 Nov 2020 16:15:17 -0700 Subject: [PATCH] nv2a: Refactor BUMPENVMAP[_LUM] --- hw/xbox/nv2a/pgraph.c | 40 +++++++++++++++--------- hw/xbox/nv2a/psh.c | 72 +++++++++++++++++++++---------------------- hw/xbox/nv2a/psh.h | 2 +- 3 files changed, 61 insertions(+), 53 deletions(-) diff --git a/hw/xbox/nv2a/pgraph.c b/hw/xbox/nv2a/pgraph.c index ba9578d01d..803c24b51a 100644 --- a/hw/xbox/nv2a/pgraph.c +++ b/hw/xbox/nv2a/pgraph.c @@ -3305,27 +3305,37 @@ static void pgraph_bind_shaders(PGRAPHState *pg) } for (i = 0; i < 4; i++) { - state.psh.rect_tex[i] = false; - bool enabled = pg->regs[NV_PGRAPH_TEXCTL0_0 + i*4] - & NV_PGRAPH_TEXCTL0_0_ENABLE; - unsigned int color_format = - GET_MASK(pg->regs[NV_PGRAPH_TEXFMT0 + i*4], - NV_PGRAPH_TEXFMT0_COLOR); - - /* This is needed to detect cases where the wrong format for ds/dt textures is used - * and a remapping of the unsigned values to signed is needed (e.g. the boost dash in JSRF) */ - state.psh.dsdt_tex[i] = kelvin_color_format_map[color_format].gl_type == GL_BYTE; - - if (enabled && kelvin_color_format_map[color_format].linear) { - state.psh.rect_tex[i] = true; - } - for (j = 0; j < 4; j++) { state.psh.compare_mode[i][j] = (pg->regs[NV_PGRAPH_SHADERCLIPMODE] >> (4 * i + j)) & 1; } state.psh.alphakill[i] = pg->regs[NV_PGRAPH_TEXCTL0_0 + i*4] & NV_PGRAPH_TEXCTL0_0_ALPHAKILLEN; + + bool enabled = pg->regs[NV_PGRAPH_TEXCTL0_0 + i*4] + & NV_PGRAPH_TEXCTL0_0_ENABLE; + if (!enabled) { + continue; + } + + unsigned int color_format = + GET_MASK(pg->regs[NV_PGRAPH_TEXFMT0 + i*4], + NV_PGRAPH_TEXFMT0_COLOR); + ColorFormatInfo f = kelvin_color_format_map[color_format]; + state.psh.rect_tex[i] = f.linear; + + /* Keep track of whether texture data has been loaded as signed + * normalized integers or not. This dictates whether or not we will need + * to re-map in fragment shader for certain texture modes (e.g. + * bumpenvmap). + * + * FIXME: When signed texture data is loaded as unsigned and remapped in + * fragment shader, there may be interpolation artifacts. Fix this to + * support signed textures more appropriately. + */ + state.psh.snorm_tex[i] = (f.gl_internal_format == GL_RGB8_SNORM) + || (f.gl_internal_format == GL_RG8_SNORM); + } ShaderBinding* cached_shader = (ShaderBinding*)g_hash_table_lookup(pg->shader_cache, &state); diff --git a/hw/xbox/nv2a/psh.c b/hw/xbox/nv2a/psh.c index 4dc810350c..8c75e12762 100644 --- a/hw/xbox/nv2a/psh.c +++ b/hw/xbox/nv2a/psh.c @@ -560,6 +560,10 @@ static QString* psh_convert(struct PixelShader *ps) " if (x >= 128.0) return (x-256.0)/127.0;\n" " else return (x)/127.0;\n" "}\n" + "float sign3_to_0_to_1(float x) {\n" + " if (x >= 0) return x/2;\n" + " else return 1+x/2;\n" + "}\n" "vec3 dotmap_zero_to_one(vec3 col) {\n" " return col;\n" "}\n" @@ -685,55 +689,49 @@ static QString* psh_convert(struct PixelShader *ps) } case PS_TEXTUREMODES_BUMPENVMAP: assert(i >= 1); - - if (!ps->state.dsdt_tex[ps->input_tex[i]]) { - /* Fix for cases using improper formats for the ds/dt offset texture, - * like the boost dash effect in JSRF */ - /* FIXME: Figure out why the green and blue channels arrive reversed */ - qstring_append_fmt(vars, "t%d.bg = dotmap_minus1_to_1_gl(t%d.rgb).gb;\n", - ps->input_tex[i], ps->input_tex[i]); - } - sampler_type = ps->state.rect_tex[i] ? "sampler2DRect" : "sampler2D"; qstring_append_fmt(preflight, "uniform mat2 bumpMat%d;\n", i); - /* FIXME: Do bumpMat swizzle on CPU before upload */ - qstring_append_fmt(vars, "t%d.gb = mat2(bumpMat%d[0].xy, bumpMat%d[1].yx) * t%d.gb;\n", - ps->input_tex[i], i, i, ps->input_tex[i]); + if (ps->state.snorm_tex[ps->input_tex[i]]) { + /* Input color channels already signed (FIXME: May not always want signed textures in this case) */ + qstring_append_fmt(vars, "vec2 dsdt%d = t%d.bg;\n", + i, ps->input_tex[i]); + } else { + /* Convert to signed (FIXME: loss of accuracy due to filtering/interpolation) */ + qstring_append_fmt(vars, "vec2 dsdt%d = vec2(sign3(t%d.b), sign3(t%d.g));\n", + i, ps->input_tex[i], ps->input_tex[i]); + } - qstring_append_fmt(vars, "vec4 t%d = texture(texSamp%d, pT%d.xy + t%d.gb);\n", - i, i, i, ps->input_tex[i]); + /* FIXME: Do bumpMat swizzle on CPU before upload */ + qstring_append_fmt(vars, "dsdt%d = mat2(bumpMat%d[0].xy, bumpMat%d[1].yx) * dsdt%d;\n", + i, i, i, i); + qstring_append_fmt(vars, "vec4 t%d = texture(texSamp%d, pT%d.xy + dsdt%d);\n", + i, i, i, i); break; case PS_TEXTUREMODES_BUMPENVMAP_LUM: assert(i >= 1); - + sampler_type = ps->state.rect_tex[i] ? "sampler2DRect" : "sampler2D"; qstring_append_fmt(preflight, "uniform float bumpScale%d;\n", i); qstring_append_fmt(preflight, "uniform float bumpOffset%d;\n", i); - - if (!ps->state.dsdt_tex[ps->input_tex[i]]) { - /* Fix for cases using improper texture formats for the ds/dt offset texture */ - /* FIXME: Figure out why the channels arrive reversed */ - qstring_append_fmt(vars, "t%d.gbr = vec3(dotmap_minus1_to_1_gl(t%d.abg).gb, t%d.r);\n", - ps->input_tex[i], ps->input_tex[i], ps->input_tex[i]); - } else { - /* FIXME: Figure out why the green and blue channels arrive reversed */ - qstring_append_fmt(vars, "t%d.rgb = vec3(t%d.rbg);\n", - ps->input_tex[i], ps->input_tex[i]); - } - - /* Now the same as BUMPENVMAP */ - sampler_type = ps->state.rect_tex[i] ? "sampler2DRect" : "sampler2D"; qstring_append_fmt(preflight, "uniform mat2 bumpMat%d;\n", i); + if (ps->state.snorm_tex[ps->input_tex[i]]) { + /* Input color channels already signed (FIXME: May not always want signed textures in this case) */ + qstring_append_fmt(vars, "vec3 dsdtl%d = vec3(t%d.bg, sign3_to_0_to_1(t%d.r));\n", + i, ps->input_tex[i], ps->input_tex[i]); + } else { + /* Convert to signed (FIXME: loss of accuracy due to filtering/interpolation) */ + qstring_append_fmt(vars, "vec3 dsdtl%d = vec3(sign3(t%d.b), sign3(t%d.g), t%d.r);\n", + i, ps->input_tex[i], ps->input_tex[i], ps->input_tex[i]); + } + /* FIXME: Do bumpMat swizzle on CPU before upload */ - qstring_append_fmt(vars, "t%d.gb = mat2(bumpMat%d[0].xy, bumpMat%d[1].yx) * t%d.gb;\n", - ps->input_tex[i], i, i, ps->input_tex[i]); - - qstring_append_fmt(vars, "vec4 t%d = texture(texSamp%d, pT%d.xy + t%d.gb);\n", - i, i, i, ps->input_tex[i]); - - qstring_append_fmt(vars, "t%d = t%d * (bumpScale%d * t%d.r + bumpOffset%d);\n", - i, i, i, ps->input_tex[i], i); + qstring_append_fmt(vars, "dsdtl%d.st = mat2(bumpMat%d[0].xy, bumpMat%d[1].yx) * dsdtl%d.st;\n", + i, i, i, i); + qstring_append_fmt(vars, "vec4 t%d = texture(texSamp%d, pT%d.xy + dsdtl%d.st);\n", + i, i, i, i); + qstring_append_fmt(vars, "t%d = t%d * (bumpScale%d * dsdtl%d.p + bumpOffset%d);\n", + i, i, i, i, i); break; case PS_TEXTUREMODES_BRDF: assert(i >= 2); diff --git a/hw/xbox/nv2a/psh.h b/hw/xbox/nv2a/psh.h index 29bf5809ab..1d7ed357c0 100644 --- a/hw/xbox/nv2a/psh.h +++ b/hw/xbox/nv2a/psh.h @@ -45,7 +45,7 @@ typedef struct PshState { uint32_t alpha_inputs[8], alpha_outputs[8]; bool rect_tex[4]; - bool dsdt_tex[4]; + bool snorm_tex[4]; bool compare_mode[4][4]; bool alphakill[4];