GBA Video: Avoid integer division using reciprocal tricks

This commit is contained in:
Vicki Pfau 2020-11-30 23:15:13 -08:00
parent e1fc8cd912
commit 41a40acefc
2 changed files with 23 additions and 11 deletions

View File

@ -94,6 +94,7 @@ Misc:
- GBA Video: Convert OpenGL VRAM texture to integer - GBA Video: Convert OpenGL VRAM texture to integer
- GBA Video: Skip attempting to render offscreen sprites in OpenGL - GBA Video: Skip attempting to render offscreen sprites in OpenGL
- GBA Video: New GL palette approach, no more batch splitting on palette edits - GBA Video: New GL palette approach, no more batch splitting on palette edits
- GBA Video: Avoid integer division using reciprocal tricks
- Debugger: Keep track of global cycle count - Debugger: Keep track of global cycle count
- FFmpeg: Add looping option for GIF/APNG - FFmpeg: Add looping option for GIF/APNG
- mGUI: Show battery percentage - mGUI: Show battery percentage

View File

@ -53,6 +53,9 @@ struct GBAVideoGLUniform {
}; };
#define PALETTE_ENTRY "#define PALETTE_ENTRY(x) (vec3((ivec3(0x1F, 0x3E0, 0x7C00) & (x)) >> ivec3(0, 5, 10)) / 31.)\n" #define PALETTE_ENTRY "#define PALETTE_ENTRY(x) (vec3((ivec3(0x1F, 0x3E0, 0x7C00) & (x)) >> ivec3(0, 5, 10)) / 31.)\n"
#define MOSAIC \
"#define MOSAIC(LHS, RHS) (((int(LHS) * mosaicTable[RHS]) >> 12) * RHS)\n" \
"const int mosaicTable[17] = int[17](0, 4096, 2048, 1366, 1024, 820, 683, 586, 512, 456, 410, 373, 342, 316, 293, 274, 256);\n"
static const GLchar* const _gles3Header = static const GLchar* const _gles3Header =
"#version 300 es\n" "#version 300 es\n"
@ -117,6 +120,7 @@ static const struct GBAVideoGLUniform _uniformsMode0[] = {
}; };
static const char* const _renderMode0 = static const char* const _renderMode0 =
MOSAIC
"in vec2 texCoord;\n" "in vec2 texCoord;\n"
"uniform isampler2D vram;\n" "uniform isampler2D vram;\n"
"uniform sampler2D palette;\n" "uniform sampler2D palette;\n"
@ -132,10 +136,10 @@ static const char* const _renderMode0 =
"void main() {\n" "void main() {\n"
" ivec2 coord = ivec2(texCoord);\n" " ivec2 coord = ivec2(texCoord);\n"
" if (mosaic.x > 1) {\n" " if (mosaic.x > 1) {\n"
" coord.x -= coord.x % mosaic.x;\n" " coord.x = MOSAIC(coord.x, mosaic.x);\n"
" }\n" " }\n"
" if (mosaic.y > 1) {\n" " if (mosaic.y > 1) {\n"
" coord.y -= coord.y % mosaic.y;\n" " coord.y = MOSAIC(coord.y, mosaic.y);\n"
" }\n" " }\n"
" coord += (ivec2(0x1FF, 0x1FF000) & offset[int(texCoord.y)]) >> ivec2(0, 12);\n" " coord += (ivec2(0x1FF, 0x1FF000) & offset[int(texCoord.y)]) >> ivec2(0, 12);\n"
" ivec2 wrap = ivec2(255, 255);\n" " ivec2 wrap = ivec2(255, 255);\n"
@ -219,6 +223,7 @@ static const char* const _interpolate =
"}\n"; "}\n";
static const char* const _renderMode2 = static const char* const _renderMode2 =
MOSAIC
"in vec2 texCoord;\n" "in vec2 texCoord;\n"
"uniform isampler2D vram;\n" "uniform isampler2D vram;\n"
"uniform sampler2D palette;\n" "uniform sampler2D palette;\n"
@ -253,10 +258,10 @@ static const char* const _renderMode2 =
" ivec2 offset[4];\n" " ivec2 offset[4];\n"
" vec2 incoord = texCoord;\n" " vec2 incoord = texCoord;\n"
" if (mosaic.x > 1) {\n" " if (mosaic.x > 1) {\n"
" incoord.x = floor(incoord.x - float(int(incoord.x) % mosaic.x));\n" " incoord.x = float(MOSAIC(incoord.x, mosaic.x));\n"
" }\n" " }\n"
" if (mosaic.y > 1) {\n" " if (mosaic.y > 1) {\n"
" incoord.y = floor(incoord.y - float(int(incoord.y) % mosaic.y));\n" " incoord.y = float(MOSAIC(incoord.y, mosaic.y));\n"
" }\n" " }\n"
" loadAffine(int(incoord.y), mat, offset);\n" " loadAffine(int(incoord.y), mat, offset);\n"
" float y = fract(incoord.y);\n" " float y = fract(incoord.y);\n"
@ -286,6 +291,7 @@ static const struct GBAVideoGLUniform _uniformsMode35[] = {
}; };
static const char* const _renderMode35 = static const char* const _renderMode35 =
MOSAIC
"in vec2 texCoord;\n" "in vec2 texCoord;\n"
"uniform isampler2D vram;\n" "uniform isampler2D vram;\n"
"uniform int charBase;\n" "uniform int charBase;\n"
@ -303,10 +309,10 @@ static const char* const _renderMode35 =
" ivec2 offset[4];\n" " ivec2 offset[4];\n"
" vec2 incoord = texCoord;\n" " vec2 incoord = texCoord;\n"
" if (mosaic.x > 1) {\n" " if (mosaic.x > 1) {\n"
" incoord.x = floor(incoord.x - float(int(incoord.x) % mosaic.x));\n" " incoord.x = floor(MOSAIC(incoord.x, mosaic.x));\n"
" }\n" " }\n"
" if (mosaic.y > 1) {\n" " if (mosaic.y > 1) {\n"
" incoord.y = floor(incoord.y - float(int(incoord.y) % mosaic.y));\n" " incoord.y = floor(MOSAIC(incoord.y, mosaic.y));\n"
" }\n" " }\n"
" loadAffine(int(incoord.y), mat, offset);\n" " loadAffine(int(incoord.y), mat, offset);\n"
" float y = fract(incoord.y);\n" " float y = fract(incoord.y);\n"
@ -345,6 +351,7 @@ static const struct GBAVideoGLUniform _uniformsMode4[] = {
}; };
static const char* const _renderMode4 = static const char* const _renderMode4 =
MOSAIC
"in vec2 texCoord;\n" "in vec2 texCoord;\n"
"uniform isampler2D vram;\n" "uniform isampler2D vram;\n"
"uniform sampler2D palette;\n" "uniform sampler2D palette;\n"
@ -363,10 +370,10 @@ static const char* const _renderMode4 =
" ivec2 offset[4];\n" " ivec2 offset[4];\n"
" vec2 incoord = texCoord;\n" " vec2 incoord = texCoord;\n"
" if (mosaic.x > 1) {\n" " if (mosaic.x > 1) {\n"
" incoord.x = floor(incoord.x - float(int(incoord.x) % mosaic.x));\n" " incoord.x = floor(MOSAIC(incoord.x, mosaic.x));\n"
" }\n" " }\n"
" if (mosaic.y > 1) {\n" " if (mosaic.y > 1) {\n"
" incoord.y = floor(incoord.y - float(int(incoord.y) % mosaic.y));\n" " incoord.y = floor(MOSAIC(incoord.y, mosaic.y));\n"
" }\n" " }\n"
" loadAffine(int(incoord.y), mat, offset);\n" " loadAffine(int(incoord.y), mat, offset);\n"
" float y = fract(incoord.y);\n" " float y = fract(incoord.y);\n"
@ -412,6 +419,7 @@ static const struct GBAVideoGLUniform _uniformsObj[] = {
}; };
static const char* const _renderObj = static const char* const _renderObj =
MOSAIC
"in vec2 texCoord;\n" "in vec2 texCoord;\n"
"uniform isampler2D vram;\n" "uniform isampler2D vram;\n"
"uniform sampler2D palette;\n" "uniform sampler2D palette;\n"
@ -434,17 +442,20 @@ static const char* const _renderObj =
" vec2 incoord = texCoord;\n" " vec2 incoord = texCoord;\n"
" if (mosaic.x > 1) {\n" " if (mosaic.x > 1) {\n"
" int x = int(incoord.x);\n" " int x = int(incoord.x);\n"
" incoord.x = float(clamp(x - (mosaic.z + x) % mosaic.x, 0, dims.z - 1));\n" " x = MOSAIC(mosaic.z + x, mosaic.x) - mosaic.z;\n"
" incoord.x = float(clamp(x, 0, dims.z - 1));\n"
" } else if (mosaic.x < -1) {\n" " } else if (mosaic.x < -1) {\n"
" int x = dims.z - int(incoord.x) - 1;\n" " int x = dims.z - int(incoord.x) - 1;\n"
" incoord.x = float(clamp(dims.z - x + (mosaic.z + x) % -mosaic.x - 1, 0, dims.z - 1));\n" " x = dims.z - MOSAIC(mosaic.z + x, -mosaic.x) + mosaic.z - 1;\n"
" incoord.x = float(clamp(x, 0, dims.z - 1));\n"
" }\n" " }\n"
" if (cyclesRemaining[int(incoord.y) + mosaic.w] <= 0) {\n" " if (cyclesRemaining[int(incoord.y) + mosaic.w] <= 0) {\n"
" discard;\n" " discard;\n"
" }\n" " }\n"
" if (mosaic.y > 1) {\n" " if (mosaic.y > 1) {\n"
" int y = int(incoord.y);\n" " int y = int(incoord.y);\n"
" incoord.y = float(clamp(y - (mosaic.w + y) % mosaic.y, 0, dims.w - 1));\n" " y = MOSAIC(mosaic.w + y, mosaic.y) - mosaic.w;"
" incoord.y = float(clamp(y, 0, dims.w - 1));\n"
" }\n" " }\n"
" ivec2 coord = ivec2(transform * (incoord - vec2(dims.zw) / 2.) + vec2(dims.xy) / 2.);\n" " ivec2 coord = ivec2(transform * (incoord - vec2(dims.zw) / 2.) + vec2(dims.xy) / 2.);\n"
" if ((coord & ~(dims.xy - 1)) != ivec2(0, 0)) {\n" " if ((coord & ~(dims.xy - 1)) != ivec2(0, 0)) {\n"