flycast/core/rend/gles/gles.cpp

1521 lines
40 KiB
C++
Raw Normal View History

2019-09-07 12:37:39 +00:00
#include <cmath>
#include "glcache.h"
2019-10-19 16:34:24 +00:00
#include "gles.h"
2013-12-19 17:10:14 +00:00
#include "rend/TexCache.h"
2019-02-06 18:57:13 +00:00
#include "rend/gui.h"
#include "wsi/gl_context.h"
#include "cfg/cfg.h"
#include "rend/osd.h"
2013-12-19 17:10:14 +00:00
#ifdef GLES
2018-10-28 23:31:24 +00:00
#ifndef GL_RED
#define GL_RED 0x1903
#endif
#ifndef GL_MAJOR_VERSION
#define GL_MAJOR_VERSION 0x821B
#endif
#endif
2019-09-04 16:40:18 +00:00
#include <png.h>
2013-12-19 17:10:14 +00:00
#include "oslib/oslib.h"
#include "rend/rend.h"
#include "input/gamepad.h"
#include <glm/gtx/transform.hpp>
2013-12-19 17:10:14 +00:00
float fb_scale_x, fb_scale_y; // FIXME
2013-12-19 17:10:14 +00:00
//Fragment and vertex shaders code
const char* VertexShaderSource =
"\
%s \n\
#define TARGET_GL %s \n\
2018-07-01 18:25:06 +00:00
#define pp_Gouraud %d \n\
\n\
#define GLES2 0 \n\
#define GLES3 1 \n\
#define GL2 2 \n\
#define GL3 3 \n\
\n\
#if TARGET_GL == GL2 \n\
#define highp \n\
#define lowp \n\
#define mediump \n\
#endif \n\
#if TARGET_GL == GLES2 || TARGET_GL == GL2 \n\
#define in attribute \n\
#define out varying \n\
#endif \n\
\n\
\n\
#if TARGET_GL == GL3 || TARGET_GL == GLES3 \n\
2018-07-01 18:25:06 +00:00
#if pp_Gouraud == 0 \n\
#define INTERPOLATION flat \n\
#else \n\
#define INTERPOLATION smooth \n\
#endif \n\
#else \n\
#define INTERPOLATION \n\
#endif \n\
\n\
2013-12-19 17:10:14 +00:00
/* Vertex constants*/ \n\
uniform highp vec4 scale; \n\
uniform highp vec4 depth_scale; \n\
uniform highp mat4 normal_matrix; \n\
/* Vertex input */ \n\
in highp vec4 in_pos; \n\
in lowp vec4 in_base; \n\
in lowp vec4 in_offs; \n\
in mediump vec2 in_uv; \n\
/* output */ \n\
INTERPOLATION out lowp vec4 vtx_base; \n\
INTERPOLATION out lowp vec4 vtx_offs; \n\
out mediump vec2 vtx_uv; \n\
2013-12-19 17:10:14 +00:00
void main() \n\
{ \n\
vtx_base = in_base; \n\
vtx_offs = in_offs; \n\
vtx_uv = in_uv; \n\
highp vec4 vpos = in_pos; \n\
if (vpos.z < 0.0 || vpos.z > 3.4e37) \n\
{ \n\
gl_Position = vec4(0.0, 0.0, 1.0, 1.0 / vpos.z); \n\
return; \n\
} \n\
\n\
vpos = normal_matrix * vpos; \n\
vpos.w = 1.0 / vpos.z; \n\
#if TARGET_GL != GLES2 \n\
vpos.z = vpos.w; \n\
#else \n\
vpos.z = depth_scale.x + depth_scale.y * vpos.w; \n\
#endif \n\
vpos.xy *= vpos.w; \n\
2013-12-19 17:10:14 +00:00
gl_Position = vpos; \n\
}";
const char* PixelPipelineShader =
"\
%s \n\
#define TARGET_GL %s \n\
\n\
2013-12-19 17:10:14 +00:00
#define cp_AlphaTest %d \n\
#define pp_ClipTestMode %d \n\
2013-12-19 17:10:14 +00:00
#define pp_UseAlpha %d \n\
#define pp_Texture %d \n\
#define pp_IgnoreTexA %d \n\
#define pp_ShadInstr %d \n\
#define pp_Offset %d \n\
#define pp_FogCtrl %d \n\
2018-07-01 18:25:06 +00:00
#define pp_Gouraud %d \n\
2018-07-02 13:23:47 +00:00
#define pp_BumpMap %d \n\
2018-09-01 10:56:37 +00:00
#define FogClamping %d \n\
#define pp_TriLinear %d \n\
2018-07-02 13:23:47 +00:00
#define PI 3.1415926 \n\
\n\
#define GLES2 0 \n\
#define GLES3 1 \n\
#define GL2 2 \n\
#define GL3 3 \n\
\n\
#if TARGET_GL == GL2 \n\
#define highp \n\
#define lowp \n\
#define mediump \n\
#endif \n\
#if TARGET_GL == GLES3 \n\
out highp vec4 FragColor; \n\
#define gl_FragColor FragColor \n\
2018-10-28 23:31:24 +00:00
#define FOG_CHANNEL a \n\
#elif TARGET_GL == GL3 \n\
out highp vec4 FragColor; \n\
#define gl_FragColor FragColor \n\
2018-10-28 23:31:24 +00:00
#define FOG_CHANNEL r \n\
#else \n\
#define in varying \n\
#define texture texture2D \n\
2018-10-28 23:31:24 +00:00
#define FOG_CHANNEL a \n\
#endif \n\
\n\
\n\
#if TARGET_GL == GL3 || TARGET_GL == GLES3 \n\
2018-07-01 18:25:06 +00:00
#if pp_Gouraud == 0 \n\
#define INTERPOLATION flat \n\
#else \n\
#define INTERPOLATION smooth \n\
#endif \n\
#else \n\
#define INTERPOLATION \n\
#endif \n\
\n\
2013-12-19 17:10:14 +00:00
/* Shader program params*/ \n\
/* gles has no alpha test stage, so its emulated on the shader */ \n\
uniform lowp float cp_AlphaTestValue; \n\
uniform lowp vec4 pp_ClipTest; \n\
uniform lowp vec3 sp_FOG_COL_RAM,sp_FOG_COL_VERT; \n\
2018-10-28 23:31:24 +00:00
uniform highp float sp_FOG_DENSITY; \n\
2013-12-19 17:10:14 +00:00
uniform sampler2D tex,fog_table; \n\
uniform lowp float trilinear_alpha; \n\
2018-09-01 10:56:37 +00:00
uniform lowp vec4 fog_clamp_min; \n\
uniform lowp vec4 fog_clamp_max; \n\
uniform highp float extra_depth_scale; \n\
2013-12-19 17:10:14 +00:00
/* Vertex input*/ \n\
INTERPOLATION in lowp vec4 vtx_base; \n\
INTERPOLATION in lowp vec4 vtx_offs; \n\
in mediump vec2 vtx_uv; \n\
2018-09-01 10:56:37 +00:00
\n\
2018-10-28 23:31:24 +00:00
lowp float fog_mode2(highp float w) \n\
2013-12-19 17:10:14 +00:00
{ \n\
highp float z = clamp(w * extra_depth_scale * sp_FOG_DENSITY, 1.0, 255.9999); \n\
2018-10-28 23:31:24 +00:00
highp float exp = floor(log2(z)); \n\
highp float m = z * 16.0 / pow(2.0, exp) - 16.0; \n\
lowp float idx = floor(m) + exp * 16.0 + 0.5; \n\
highp vec4 fog_coef = texture(fog_table, vec2(idx / 128.0, 0.75 - (m - floor(m)) / 2.0)); \n\
return fog_coef.FOG_CHANNEL; \n\
2013-12-19 17:10:14 +00:00
} \n\
2018-09-01 10:56:37 +00:00
\n\
highp vec4 fog_clamp(lowp vec4 col) \n\
2018-09-01 10:56:37 +00:00
{ \n\
#if FogClamping == 1 \n\
return clamp(col, fog_clamp_min, fog_clamp_max); \n\
#else \n\
return col; \n\
#endif \n\
} \n\
\n\
2013-12-19 17:10:14 +00:00
void main() \n\
{ \n\
// Clip outside the box \n\
#if pp_ClipTestMode==1 \n\
if (gl_FragCoord.x < pp_ClipTest.x || gl_FragCoord.x > pp_ClipTest.z \n\
|| gl_FragCoord.y < pp_ClipTest.y || gl_FragCoord.y > pp_ClipTest.w) \n\
discard; \n\
#endif \n\
// Clip inside the box \n\
#if pp_ClipTestMode==-1 \n\
if (gl_FragCoord.x >= pp_ClipTest.x && gl_FragCoord.x <= pp_ClipTest.z \n\
&& gl_FragCoord.y >= pp_ClipTest.y && gl_FragCoord.y <= pp_ClipTest.w) \n\
discard; \n\
#endif \n\
\n\
2013-12-19 17:10:14 +00:00
lowp vec4 color=vtx_base; \n\
#if pp_UseAlpha==0 \n\
color.a=1.0; \n\
#endif\n\
#if pp_FogCtrl==3 \n\
2018-10-28 23:31:24 +00:00
color=vec4(sp_FOG_COL_RAM.rgb,fog_mode2(gl_FragCoord.w)); \n\
2013-12-19 17:10:14 +00:00
#endif\n\
#if pp_Texture==1 \n\
{ \n\
lowp vec4 texcol=texture(tex, vtx_uv); \n\
2018-07-02 13:23:47 +00:00
\n\
#if pp_BumpMap == 1 \n\
highp float s = PI / 2.0 * (texcol.a * 15.0 * 16.0 + texcol.r * 15.0) / 255.0; \n\
highp float r = 2.0 * PI * (texcol.g * 15.0 * 16.0 + texcol.b * 15.0) / 255.0; \n\
2018-07-02 13:23:47 +00:00
texcol.a = clamp(vtx_offs.a + vtx_offs.r * sin(s) + vtx_offs.g * cos(s) * cos(r - 2.0 * PI * vtx_offs.b), 0.0, 1.0); \n\
texcol.rgb = vec3(1.0, 1.0, 1.0); \n\
#else\n\
#if pp_IgnoreTexA==1 \n\
texcol.a=1.0; \n\
#endif\n\
\n\
#if cp_AlphaTest == 1 \n\
if (cp_AlphaTestValue > texcol.a) \n\
discard; \n\
#endif \n\
2018-07-02 13:23:47 +00:00
#endif \n\
2013-12-19 17:10:14 +00:00
#if pp_ShadInstr==0 \n\
{ \n\
color=texcol; \n\
2013-12-19 17:10:14 +00:00
} \n\
#endif\n\
#if pp_ShadInstr==1 \n\
{ \n\
color.rgb*=texcol.rgb; \n\
color.a=texcol.a; \n\
} \n\
#endif\n\
#if pp_ShadInstr==2 \n\
{ \n\
color.rgb=mix(color.rgb,texcol.rgb,texcol.a); \n\
} \n\
#endif\n\
#if pp_ShadInstr==3 \n\
{ \n\
color*=texcol; \n\
} \n\
#endif\n\
\n\
2018-07-02 13:23:47 +00:00
#if pp_Offset==1 && pp_BumpMap == 0 \n\
2013-12-19 17:10:14 +00:00
{ \n\
color.rgb+=vtx_offs.rgb; \n\
} \n\
#endif\n\
} \n\
#endif\n\
\n\
color = fog_clamp(color); \n\
\n\
#if pp_FogCtrl == 0 \n\
2013-12-19 17:10:14 +00:00
{ \n\
2018-10-28 23:31:24 +00:00
color.rgb=mix(color.rgb,sp_FOG_COL_RAM.rgb,fog_mode2(gl_FragCoord.w)); \n\
2013-12-19 17:10:14 +00:00
} \n\
#endif\n\
#if pp_FogCtrl == 1 && pp_Offset==1 && pp_BumpMap == 0 \n\
{ \n\
color.rgb=mix(color.rgb,sp_FOG_COL_VERT.rgb,vtx_offs.a); \n\
} \n\
#endif\n\
\n\
#if pp_TriLinear == 1 \n\
color *= trilinear_alpha; \n\
#endif \n\
\n\
2013-12-19 17:10:14 +00:00
#if cp_AlphaTest == 1 \n\
color.a=1.0; \n\
2013-12-19 17:10:14 +00:00
#endif \n\
//color.rgb=vec3(gl_FragCoord.w * sp_FOG_DENSITY / 128.0);\n\
#if TARGET_GL != GLES2 \n\
highp float w = gl_FragCoord.w * 100000.0; \n\
gl_FragDepth = log2(1.0 + w) / 34.0; \n\
#endif \n\
gl_FragColor =color; \n\
2013-12-19 17:10:14 +00:00
}";
const char* ModifierVolumeShader =
"\
%s \n\
#define TARGET_GL %s \n\
\n\
#define GLES2 0 \n\
#define GLES3 1 \n\
#define GL2 2 \n\
#define GL3 3 \n\
\n\
#if TARGET_GL == GL2 \n\
#define highp \n\
#define lowp \n\
#define mediump \n\
#endif \n\
#if TARGET_GL != GLES2 && TARGET_GL != GL2 \n\
out highp vec4 FragColor; \n\
#define gl_FragColor FragColor \n\
#endif \n\
\n\
2013-12-19 17:10:14 +00:00
uniform lowp float sp_ShaderColor; \n\
/* Vertex input*/ \n\
void main() \n\
{ \n\
#if TARGET_GL != GLES2 \n\
highp float w = gl_FragCoord.w * 100000.0; \n\
gl_FragDepth = log2(1.0 + w) / 34.0; \n\
#endif \n\
gl_FragColor=vec4(0.0, 0.0, 0.0, sp_ShaderColor); \n\
2013-12-19 17:10:14 +00:00
}";
const char* OSD_VertexShader =
"\
%s \n\
#define TARGET_GL %s \n\
\n\
#define GLES2 0 \n\
#define GLES3 1 \n\
#define GL2 2 \n\
#define GL3 3 \n\
\n\
#if TARGET_GL == GL2 \n\
#define highp \n\
#define lowp \n\
#define mediump \n\
#endif \n\
#if TARGET_GL == GLES2 || TARGET_GL == GL2 \n\
#define in attribute \n\
#define out varying \n\
#endif \n\
\n\
uniform highp vec4 scale; \n\
\n\
in highp vec4 in_pos; \n\
in lowp vec4 in_base; \n\
in mediump vec2 in_uv; \n\
\n\
out lowp vec4 vtx_base; \n\
out mediump vec2 vtx_uv; \n\
\n\
void main() \n\
{ \n\
vtx_base = in_base; \n\
vtx_uv = in_uv; \n\
highp vec4 vpos = in_pos; \n\
\n\
vpos.w = 1.0; \n\
vpos.z = vpos.w; \n\
vpos.xy = vpos.xy * scale.xy - scale.zw; \n\
gl_Position = vpos; \n\
}";
const char* OSD_Shader =
"\
%s \n\
#define TARGET_GL %s \n\
\n\
#define GLES2 0 \n\
#define GLES3 1 \n\
#define GL2 2 \n\
#define GL3 3 \n\
\n\
#if TARGET_GL == GL2 \n\
#define highp \n\
#define lowp \n\
#define mediump \n\
#endif \n\
#if TARGET_GL != GLES2 && TARGET_GL != GL2 \n\
out highp vec4 FragColor; \n\
#define gl_FragColor FragColor \n\
#else \n\
#define in varying \n\
#define texture texture2D \n\
#endif \n\
\n\
in lowp vec4 vtx_base; \n\
in mediump vec2 vtx_uv; \n\
\n\
2013-12-19 17:10:14 +00:00
uniform sampler2D tex; \n\
void main() \n\
{ \n\
gl_FragColor = vtx_base * texture(tex, vtx_uv); \n\
2013-12-19 17:10:14 +00:00
}";
GLCache glcache;
2013-12-19 17:10:14 +00:00
gl_ctx gl;
int screen_width;
int screen_height;
2018-06-05 10:18:09 +00:00
GLuint fogTextureId;
glm::mat4 ViewportMatrix;
#ifdef TEST_AUTOMATION
static void dump_screenshot(u8 *buffer, u32 width, u32 height)
{
FILE *fp = fopen("screenshot.png", "wb");
if (fp == NULL)
{
ERROR_LOG(RENDERER, "Failed to open screenshot.png for writing\n");
return;
}
png_bytepp rows = (png_bytepp)malloc(height * sizeof(png_bytep));
for (int y = 0; y < height; y++)
{
rows[height - y - 1] = (png_bytep)buffer + y * width * 3;
}
png_structp png_ptr = png_create_write_struct(PNG_LIBPNG_VER_STRING, NULL, NULL, NULL);
png_infop info_ptr = png_create_info_struct(png_ptr);
png_init_io(png_ptr, fp);
// write header
png_set_IHDR(png_ptr, info_ptr, width, height,
8, PNG_COLOR_TYPE_RGB, PNG_INTERLACE_NONE,
PNG_COMPRESSION_TYPE_BASE, PNG_FILTER_TYPE_BASE);
png_write_info(png_ptr, info_ptr);
// write bytes
png_write_image(png_ptr, rows);
// end write
png_write_end(png_ptr, NULL);
fclose(fp);
free(rows);
}
void do_swap_automation()
{
static FILE* video_file = fopen(cfgLoadStr("record", "rawvid","").c_str(), "wb");
extern bool do_screenshot;
if (video_file)
{
int bytesz = screen_width * screen_height * 3;
u8* img = new u8[bytesz];
glReadPixels(0, 0, screen_width, screen_height, GL_RGB, GL_UNSIGNED_BYTE, img);
fwrite(img, 1, bytesz, video_file);
fflush(video_file);
}
if (do_screenshot)
{
extern void dc_exit();
int bytesz = screen_width * screen_height * 3;
u8* img = new u8[bytesz];
glReadPixels(0, 0, screen_width, screen_height, GL_RGB, GL_UNSIGNED_BYTE, img);
dump_screenshot(img, screen_width, screen_height);
delete[] img;
dc_exit();
exit(0);
}
}
#endif
static void gl_delete_shaders()
{
for (auto it : gl.shaders)
{
if (it.second.program != 0)
glcache.DeleteProgram(it.second.program);
}
gl.shaders.clear();
glcache.DeleteProgram(gl.modvol_shader.program);
gl.modvol_shader.program = 0;
}
static void gles_term()
2019-02-17 23:38:11 +00:00
{
glDeleteBuffers(1, &gl.vbo.geometry);
gl.vbo.geometry = 0;
glDeleteBuffers(1, &gl.vbo.modvols);
glDeleteBuffers(1, &gl.vbo.idxs);
glDeleteBuffers(1, &gl.vbo.idxs2);
glcache.DeleteTextures(1, &fbTextureId);
fbTextureId = 0;
glcache.DeleteTextures(1, &fogTextureId);
fogTextureId = 0;
gl_free_osd_resources();
free_output_framebuffer();
gl_delete_shaders();
}
2013-12-19 17:10:14 +00:00
void findGLVersion()
{
gl.index_type = GL_UNSIGNED_INT;
2019-10-19 16:34:24 +00:00
gl.gl_major = theGLContext.GetMajorVersion();
gl.is_gles = theGLContext.IsGLES();
if (gl.is_gles)
{
if (gl.gl_major >= 3)
{
gl.gl_version = "GLES3";
gl.glsl_version_header = "#version 300 es";
}
else
{
gl.gl_version = "GLES2";
gl.glsl_version_header = "";
gl.index_type = GL_UNSIGNED_SHORT;
}
2018-10-28 23:31:24 +00:00
gl.fog_image_format = GL_ALPHA;
const char *extensions = (const char *)glGetString(GL_EXTENSIONS);
if (strstr(extensions, "GL_OES_packed_depth_stencil") != NULL)
gl.GL_OES_packed_depth_stencil_supported = true;
if (strstr(extensions, "GL_OES_depth24") != NULL)
gl.GL_OES_depth24_supported = true;
if (!gl.GL_OES_packed_depth_stencil_supported)
INFO_LOG(RENDERER, "Packed depth/stencil not supported: no modifier volumes when rendering to a texture");
}
else
{
if (gl.gl_major >= 3)
{
gl.gl_version = "GL3";
2018-10-30 10:48:44 +00:00
#if HOST_OS == OS_DARWIN
gl.glsl_version_header = "#version 150";
#else
gl.glsl_version_header = "#version 130";
2018-10-30 10:48:44 +00:00
#endif
2018-10-28 23:31:24 +00:00
gl.fog_image_format = GL_RED;
}
else
{
gl.gl_version = "GL2";
gl.glsl_version_header = "#version 120";
2018-10-28 23:31:24 +00:00
gl.fog_image_format = GL_ALPHA;
}
}
}
struct ShaderUniforms_t ShaderUniforms;
2013-12-19 17:10:14 +00:00
GLuint gl_CompileShader(const char* shader,GLuint type)
{
GLint result;
GLint compile_log_len;
GLuint rv=glCreateShader(type);
glShaderSource(rv, 1,&shader, NULL);
glCompileShader(rv);
//lets see if it compiled ...
glGetShaderiv(rv, GL_COMPILE_STATUS, &result);
glGetShaderiv(rv, GL_INFO_LOG_LENGTH, &compile_log_len);
if (!result && compile_log_len>0)
{
char* compile_log=(char*)malloc(compile_log_len);
*compile_log=0;
glGetShaderInfoLog(rv, compile_log_len, &compile_log_len, compile_log);
WARN_LOG(RENDERER, "Shader: %s \n%s", result ? "compiled!" : "failed to compile", compile_log);
2013-12-19 17:10:14 +00:00
free(compile_log);
}
return rv;
}
GLuint gl_CompileAndLink(const char* VertexShader, const char* FragmentShader)
{
//create shaders
GLuint vs=gl_CompileShader(VertexShader ,GL_VERTEX_SHADER);
GLuint ps=gl_CompileShader(FragmentShader ,GL_FRAGMENT_SHADER);
GLuint program = glCreateProgram();
glAttachShader(program, vs);
glAttachShader(program, ps);
//bind vertex attribute to vbo inputs
glBindAttribLocation(program, VERTEX_POS_ARRAY, "in_pos");
glBindAttribLocation(program, VERTEX_COL_BASE_ARRAY, "in_base");
glBindAttribLocation(program, VERTEX_COL_OFFS_ARRAY, "in_offs");
glBindAttribLocation(program, VERTEX_UV_ARRAY, "in_uv");
2018-10-04 08:29:23 +00:00
glBindAttribLocation(program, VERTEX_COL_BASE1_ARRAY, "in_base1");
glBindAttribLocation(program, VERTEX_COL_OFFS1_ARRAY, "in_offs1");
glBindAttribLocation(program, VERTEX_UV1_ARRAY, "in_uv1");
2013-12-19 17:10:14 +00:00
#ifdef glBindFragDataLocation
if (!gl.is_gles && gl.gl_major >= 3)
glBindFragDataLocation(program, 0, "FragColor");
#endif
2013-12-19 17:10:14 +00:00
glLinkProgram(program);
GLint result;
glGetProgramiv(program, GL_LINK_STATUS, &result);
GLint compile_log_len;
glGetProgramiv(program, GL_INFO_LOG_LENGTH, &compile_log_len);
if (!result && compile_log_len>0)
{
compile_log_len+= 1024;
2013-12-19 17:10:14 +00:00
char* compile_log=(char*)malloc(compile_log_len);
*compile_log=0;
glGetProgramInfoLog(program, compile_log_len, &compile_log_len, compile_log);
WARN_LOG(RENDERER, "Shader linking: %s \n (%d bytes), - %s -", result ? "linked" : "failed to link", compile_log_len, compile_log);
2013-12-19 17:10:14 +00:00
free(compile_log);
2018-07-16 14:52:11 +00:00
// Dump the shaders source for troubleshooting
INFO_LOG(RENDERER, "// VERTEX SHADER\n%s\n// END", VertexShader);
INFO_LOG(RENDERER, "// FRAGMENT SHADER\n%s\n// END", FragmentShader);
2013-12-19 17:10:14 +00:00
die("shader compile fail\n");
}
glDeleteShader(vs);
glDeleteShader(ps);
glcache.UseProgram(program);
2013-12-19 17:10:14 +00:00
verify(glIsProgram(program));
return program;
}
PipelineShader *GetProgram(u32 cp_AlphaTest, u32 pp_ClipTestMode,
2013-12-19 17:10:14 +00:00
u32 pp_Texture, u32 pp_UseAlpha, u32 pp_IgnoreTexA, u32 pp_ShadInstr, u32 pp_Offset,
u32 pp_FogCtrl, bool pp_Gouraud, bool pp_BumpMap, bool fog_clamping, bool trilinear)
2013-12-19 17:10:14 +00:00
{
u32 rv=0;
rv|=pp_ClipTestMode;
rv<<=1; rv|=cp_AlphaTest;
rv<<=1; rv|=pp_Texture;
rv<<=1; rv|=pp_UseAlpha;
rv<<=1; rv|=pp_IgnoreTexA;
rv<<=2; rv|=pp_ShadInstr;
rv<<=1; rv|=pp_Offset;
rv<<=2; rv|=pp_FogCtrl;
2018-07-01 18:25:06 +00:00
rv<<=1; rv|=pp_Gouraud;
2018-07-02 13:23:47 +00:00
rv<<=1; rv|=pp_BumpMap;
2018-09-01 10:56:37 +00:00
rv<<=1; rv|=fog_clamping;
rv<<=1; rv|=trilinear;
2013-12-19 17:10:14 +00:00
PipelineShader *shader = &gl.shaders[rv];
if (shader->program == 0)
{
shader->cp_AlphaTest = cp_AlphaTest;
shader->pp_ClipTestMode = pp_ClipTestMode-1;
shader->pp_Texture = pp_Texture;
shader->pp_UseAlpha = pp_UseAlpha;
shader->pp_IgnoreTexA = pp_IgnoreTexA;
shader->pp_ShadInstr = pp_ShadInstr;
shader->pp_Offset = pp_Offset;
shader->pp_FogCtrl = pp_FogCtrl;
shader->pp_Gouraud = pp_Gouraud;
shader->pp_BumpMap = pp_BumpMap;
shader->fog_clamping = fog_clamping;
shader->trilinear = trilinear;
CompilePipelineShader(shader);
}
return shader;
2013-12-19 17:10:14 +00:00
}
bool CompilePipelineShader( PipelineShader* s)
{
2018-07-01 18:25:06 +00:00
char vshader[8192];
sprintf(vshader, VertexShaderSource, gl.glsl_version_header, gl.gl_version, s->pp_Gouraud);
2013-12-19 17:10:14 +00:00
char pshader[8192];
sprintf(pshader,PixelPipelineShader, gl.glsl_version_header, gl.gl_version,
2013-12-19 17:10:14 +00:00
s->cp_AlphaTest,s->pp_ClipTestMode,s->pp_UseAlpha,
2018-09-01 10:56:37 +00:00
s->pp_Texture,s->pp_IgnoreTexA,s->pp_ShadInstr,s->pp_Offset,s->pp_FogCtrl, s->pp_Gouraud, s->pp_BumpMap,
s->fog_clamping, s->trilinear);
2013-12-19 17:10:14 +00:00
2018-07-01 18:25:06 +00:00
s->program=gl_CompileAndLink(vshader, pshader);
2013-12-19 17:10:14 +00:00
//setup texture 0 as the input for the shader
GLuint gu=glGetUniformLocation(s->program, "tex");
if (s->pp_Texture==1)
glUniform1i(gu,0);
//get the uniform locations
s->depth_scale = glGetUniformLocation(s->program, "depth_scale");
s->extra_depth_scale = glGetUniformLocation(s->program, "extra_depth_scale");
s->pp_ClipTest = glGetUniformLocation(s->program, "pp_ClipTest");
s->sp_FOG_DENSITY = glGetUniformLocation(s->program, "sp_FOG_DENSITY");
2013-12-19 17:10:14 +00:00
s->cp_AlphaTestValue= glGetUniformLocation(s->program, "cp_AlphaTestValue");
//FOG_COL_RAM,FOG_COL_VERT,FOG_DENSITY;
if (s->pp_FogCtrl==1 && s->pp_Texture==1)
s->sp_FOG_COL_VERT=glGetUniformLocation(s->program, "sp_FOG_COL_VERT");
else
s->sp_FOG_COL_VERT=-1;
if (s->pp_FogCtrl==0 || s->pp_FogCtrl==3)
{
s->sp_FOG_COL_RAM=glGetUniformLocation(s->program, "sp_FOG_COL_RAM");
}
else
{
s->sp_FOG_COL_RAM=-1;
}
2018-10-28 23:31:24 +00:00
// Setup texture 1 as the fog table
gu = glGetUniformLocation(s->program, "fog_table");
if (gu != -1)
glUniform1i(gu, 1);
s->trilinear_alpha = glGetUniformLocation(s->program, "trilinear_alpha");
2018-09-01 10:56:37 +00:00
if (s->fog_clamping)
{
s->fog_clamp_min = glGetUniformLocation(s->program, "fog_clamp_min");
s->fog_clamp_max = glGetUniformLocation(s->program, "fog_clamp_max");
}
else
{
s->fog_clamp_min = -1;
s->fog_clamp_max = -1;
}
s->normal_matrix = glGetUniformLocation(s->program, "normal_matrix");
2013-12-19 17:10:14 +00:00
ShaderUniforms.Set(s);
return glIsProgram(s->program)==GL_TRUE;
}
static void SetupOSDVBO()
{
#ifndef GLES2
if (gl.gl_major >= 3)
{
if (gl.OSD_SHADER.vao == 0)
glGenVertexArrays(1, &gl.OSD_SHADER.vao);
glBindVertexArray(gl.OSD_SHADER.vao);
}
#endif
if (gl.OSD_SHADER.geometry == 0)
glGenBuffers(1, &gl.OSD_SHADER.geometry);
glBindBuffer(GL_ARRAY_BUFFER, gl.OSD_SHADER.geometry);
glBindBuffer(GL_ELEMENT_ARRAY_BUFFER, 0);
//setup vertex buffers attrib pointers
glEnableVertexAttribArray(VERTEX_POS_ARRAY);
glVertexAttribPointer(VERTEX_POS_ARRAY, 2, GL_FLOAT, GL_FALSE, sizeof(OSDVertex), (void*)offsetof(OSDVertex, x));
glEnableVertexAttribArray(VERTEX_COL_BASE_ARRAY);
glVertexAttribPointer(VERTEX_COL_BASE_ARRAY, 4, GL_UNSIGNED_BYTE, GL_TRUE, sizeof(OSDVertex), (void*)offsetof(OSDVertex, r));
glEnableVertexAttribArray(VERTEX_UV_ARRAY);
glVertexAttribPointer(VERTEX_UV_ARRAY, 2, GL_FLOAT, GL_FALSE, sizeof(OSDVertex), (void*)offsetof(OSDVertex, u));
glDisableVertexAttribArray(VERTEX_COL_OFFS_ARRAY);
glCheck();
}
2013-12-19 17:10:14 +00:00
2018-10-04 12:49:20 +00:00
void gl_load_osd_resources()
{
char vshader[8192];
char fshader[8192];
sprintf(vshader, OSD_VertexShader, gl.glsl_version_header, gl.gl_version);
sprintf(fshader, OSD_Shader, gl.glsl_version_header, gl.gl_version);
gl.OSD_SHADER.program = gl_CompileAndLink(vshader, fshader);
gl.OSD_SHADER.scale = glGetUniformLocation(gl.OSD_SHADER.program, "scale");
glUniform1i(glGetUniformLocation(gl.OSD_SHADER.program, "tex"), 0); //bind osd texture to slot 0
2018-10-04 12:49:20 +00:00
#ifdef __ANDROID__
2018-10-04 12:49:20 +00:00
int w, h;
if (gl.OSD_SHADER.osd_tex == 0)
gl.OSD_SHADER.osd_tex = loadPNG(get_readonly_data_path(DATA_PATH "buttons.png"), w, h);
2014-02-28 21:42:32 +00:00
#endif
SetupOSDVBO();
2018-10-04 12:49:20 +00:00
}
2013-12-19 17:10:14 +00:00
void gl_free_osd_resources()
{
glcache.DeleteProgram(gl.OSD_SHADER.program);
if (gl.OSD_SHADER.osd_tex != 0) {
glcache.DeleteTextures(1, &gl.OSD_SHADER.osd_tex);
gl.OSD_SHADER.osd_tex = 0;
}
glDeleteBuffers(1, &gl.OSD_SHADER.geometry);
gl.OSD_SHADER.geometry = 0;
#ifndef GLES2
glDeleteVertexArrays(1, &gl.OSD_SHADER.vao);
gl.OSD_SHADER.vao = 0;
#endif
}
static void create_modvol_shader()
{
if (gl.modvol_shader.program != 0)
return;
char vshader[8192];
sprintf(vshader, VertexShaderSource, gl.glsl_version_header, gl.gl_version, 1);
char fshader[8192];
sprintf(fshader, ModifierVolumeShader, gl.glsl_version_header, gl.gl_version);
gl.modvol_shader.program = gl_CompileAndLink(vshader, fshader);
gl.modvol_shader.normal_matrix = glGetUniformLocation(gl.modvol_shader.program, "normal_matrix");
gl.modvol_shader.sp_ShaderColor = glGetUniformLocation(gl.modvol_shader.program, "sp_ShaderColor");
gl.modvol_shader.depth_scale = glGetUniformLocation(gl.modvol_shader.program, "depth_scale");
gl.modvol_shader.extra_depth_scale = glGetUniformLocation(gl.modvol_shader.program, "extra_depth_scale");
}
2013-12-19 17:10:14 +00:00
bool gl_create_resources()
{
if (gl.vbo.geometry != 0)
// Assume the resources have already been created
return true;
findGLVersion();
if (gl.gl_major >= 3)
{
verify(glGenVertexArrays != NULL);
//create vao
//This is really not "proper", vaos are supposed to be defined once
//i keep updating the same one to make the es2 code work in 3.1 context
#ifndef GLES2
glGenVertexArrays(1, &gl.vbo.vao);
#endif
}
2013-12-19 17:10:14 +00:00
//create vbos
glGenBuffers(1, &gl.vbo.geometry);
glGenBuffers(1, &gl.vbo.modvols);
glGenBuffers(1, &gl.vbo.idxs);
glGenBuffers(1, &gl.vbo.idxs2);
create_modvol_shader();
2013-12-19 17:10:14 +00:00
2018-10-04 12:49:20 +00:00
gl_load_osd_resources();
2013-12-19 17:10:14 +00:00
return true;
}
GLuint gl_CompileShader(const char* shader,GLuint type);
bool gl_create_resources();
//setup
bool gles_init()
{
2018-10-05 13:07:30 +00:00
glcache.EnableCache();
2013-12-19 17:10:14 +00:00
if (!gl_create_resources())
return false;
2018-10-04 08:29:23 +00:00
// glEnable(GL_DEBUG_OUTPUT);
// glEnable(GL_DEBUG_OUTPUT_SYNCHRONOUS);
// glDebugMessageCallback(gl_DebugOutput, NULL);
// glDebugMessageControl(GL_DONT_CARE, GL_DONT_CARE, GL_DONT_CARE, 0, NULL, GL_TRUE);
//clean up the buffer
glcache.ClearColor(0.f, 0.f, 0.f, 0.f);
glClear(GL_COLOR_BUFFER_BIT);
theGLContext.Swap();
#ifdef GL_GENERATE_MIPMAP_HINT
if (gl.is_gles)
glHint(GL_GENERATE_MIPMAP_HINT, GL_FASTEST);
2018-05-15 20:37:40 +00:00
#endif
glCheck();
2018-05-15 20:37:40 +00:00
2018-08-01 17:43:01 +00:00
if (settings.rend.TextureUpscale > 1)
2013-12-19 17:10:14 +00:00
{
2018-08-01 17:43:01 +00:00
// Trick to preload the tables used by xBRZ
u32 src[] { 0x11111111, 0x22222222, 0x33333333, 0x44444444 };
u32 dst[16];
UpscalexBRZ(2, src, dst, 2, 2, false);
2013-12-19 17:10:14 +00:00
}
2018-10-05 13:07:30 +00:00
fog_needs_update = true;
2013-12-19 17:10:14 +00:00
return true;
}
2018-10-28 23:31:24 +00:00
void UpdateFogTexture(u8 *fog_table, GLenum texture_slot, GLint fog_image_format)
2013-12-19 17:10:14 +00:00
{
2018-10-28 23:31:24 +00:00
glActiveTexture(texture_slot);
if (fogTextureId == 0)
2013-12-19 17:10:14 +00:00
{
2018-06-05 10:18:09 +00:00
fogTextureId = glcache.GenTexture();
glcache.BindTexture(GL_TEXTURE_2D, fogTextureId);
glcache.TexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_LINEAR);
glcache.TexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_LINEAR);
glcache.TexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE);
glcache.TexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE);
2013-12-19 17:10:14 +00:00
}
2018-10-28 23:31:24 +00:00
else
2018-06-05 10:18:09 +00:00
glcache.BindTexture(GL_TEXTURE_2D, fogTextureId);
2013-12-19 17:10:14 +00:00
2018-10-28 23:31:24 +00:00
u8 temp_tex_buffer[256];
2019-10-06 15:02:17 +00:00
MakeFogTexture(temp_tex_buffer);
2018-10-28 23:31:24 +00:00
glPixelStorei(GL_UNPACK_ALIGNMENT, 1);
glTexImage2D(GL_TEXTURE_2D, 0, fog_image_format, 128, 2, 0, fog_image_format, GL_UNSIGNED_BYTE, temp_tex_buffer);
glCheck();
2013-12-19 17:10:14 +00:00
2018-10-28 23:31:24 +00:00
glActiveTexture(GL_TEXTURE0);
}
2013-12-19 17:10:14 +00:00
void OSD_DRAW(bool clear_screen)
2013-12-19 17:10:14 +00:00
{
#ifdef __ANDROID__
if (gl.OSD_SHADER.osd_tex == 0)
gl_load_osd_resources();
if (gl.OSD_SHADER.osd_tex != 0)
2013-12-19 17:10:14 +00:00
{
const std::vector<OSDVertex>& osdVertices = GetOSDVertices();
#ifndef GLES2
if (gl.gl_major >= 3)
glBindVertexArray(gl.OSD_SHADER.vao);
else
#endif
SetupOSDVBO();
2013-12-19 17:10:14 +00:00
glBindBuffer(GL_ARRAY_BUFFER, gl.OSD_SHADER.geometry);
2013-12-19 17:10:14 +00:00
verify(glIsProgram(gl.OSD_SHADER.program));
glcache.UseProgram(gl.OSD_SHADER.program);
2013-12-19 17:10:14 +00:00
float scale_h = screen_height / 480.f;
float offs_x = (screen_width - scale_h * 640.f) / 2.f;
float scale[4];
scale[0] = 2.f / (screen_width / scale_h);
scale[1]= -2.f / 480.f;
scale[2]= 1.f - 2.f * offs_x / screen_width;
scale[3]= -1.f;
glUniform4fv(gl.OSD_SHADER.scale, 1, scale);
2014-01-21 15:39:05 +00:00
glActiveTexture(GL_TEXTURE0);
glcache.BindTexture(GL_TEXTURE_2D, gl.OSD_SHADER.osd_tex);
2014-01-21 15:39:05 +00:00
glBindFramebuffer(GL_FRAMEBUFFER, 0);
glBufferData(GL_ARRAY_BUFFER, osdVertices.size() * sizeof(OSDVertex), osdVertices.data(), GL_STREAM_DRAW); glCheck();
2014-01-21 15:39:05 +00:00
glcache.Enable(GL_BLEND);
glcache.Disable(GL_DEPTH_TEST);
glcache.BlendFunc(GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA);
2013-12-19 17:10:14 +00:00
glcache.DepthMask(false);
glcache.DepthFunc(GL_ALWAYS);
2013-12-19 17:10:14 +00:00
glcache.Disable(GL_CULL_FACE);
glcache.Disable(GL_SCISSOR_TEST);
glViewport(0, 0, screen_width, screen_height);
2013-12-19 17:10:14 +00:00
if (clear_screen)
{
glcache.ClearColor(0.7f, 0.7f, 0.7f, 1.f);
glClear(GL_COLOR_BUFFER_BIT);
}
int dfa = osdVertices.size() / 4;
2013-12-19 17:10:14 +00:00
2019-02-18 23:49:24 +00:00
for (int i = 0; i < dfa; i++)
glDrawArrays(GL_TRIANGLE_STRIP, i * 4, 4);
glCheck();
2013-12-19 17:10:14 +00:00
}
2014-02-28 21:42:32 +00:00
#endif
gui_display_osd();
2013-12-19 17:10:14 +00:00
}
bool ProcessFrame(TA_context* ctx)
{
ctx->rend_inuse.Lock();
if (KillTex)
TexCache.Clear();
2018-08-26 14:58:10 +00:00
if (ctx->rend.isRenderFramebuffer)
{
RenderFramebuffer();
ctx->rend_inuse.Unlock();
}
2018-08-26 14:58:10 +00:00
else
{
if (!ta_parse_vdrc(ctx))
return false;
}
TexCache.CollectCleanup();
if (ctx->rend.Overrun)
WARN_LOG(PVR, "ERROR: TA context overrun");
return !ctx->rend.Overrun;
}
static void upload_vertex_indices()
2013-12-19 17:10:14 +00:00
{
if (gl.index_type == GL_UNSIGNED_SHORT)
{
static bool overrun;
static List<u16> short_idx;
if (short_idx.daty != NULL)
short_idx.Free();
short_idx.Init(pvrrc.idx.used(), &overrun, NULL);
for (u32 *p = pvrrc.idx.head(); p < pvrrc.idx.LastPtr(0); p++)
*(short_idx.Append()) = *p;
glBufferData(GL_ELEMENT_ARRAY_BUFFER, short_idx.bytes(), short_idx.head(), GL_STREAM_DRAW);
}
else
glBufferData(GL_ELEMENT_ARRAY_BUFFER,pvrrc.idx.bytes(),pvrrc.idx.head(),GL_STREAM_DRAW);
glCheck();
}
void GetFramebufferScaling(float& scale_x, float& scale_y, float& scissoring_scale_x, float& scissoring_scale_y)
{
scale_x = 1;
scale_y = 1;
scissoring_scale_x = 1;
scissoring_scale_y = 1;
if (!pvrrc.isRTT && !pvrrc.isRenderFramebuffer)
2013-12-19 17:10:14 +00:00
{
scale_x = fb_scale_x;
scale_y = fb_scale_y;
if (SCALER_CTL.vscalefactor >= 0x400)
{
// Interlace mode A (single framebuffer)
if (SCALER_CTL.interlace == 0)
scale_y *= (float)SCALER_CTL.vscalefactor / 0x400;
else
// Interlace mode B (alternating framebuffers)
scissoring_scale_y /= (float)SCALER_CTL.vscalefactor / 0x400;
}
// VO pixel doubling is done after fb rendering/clipping
// so it should be used for scissoring as well
if (VO_CONTROL.pixel_double)
scale_x *= 0.5f;
// the X Scaler halves the horizontal resolution but
// before clipping/scissoring
if (SCALER_CTL.hscale)
{
scissoring_scale_x /= 2.f;
scale_x *= 2.f;
}
2013-12-19 17:10:14 +00:00
}
}
2013-12-19 17:10:14 +00:00
void GetFramebufferSize(float& dc_width, float& dc_height)
{
if (pvrrc.isRTT)
{
dc_width = pvrrc.fb_X_CLIP.max - pvrrc.fb_X_CLIP.min + 1;
dc_height = pvrrc.fb_Y_CLIP.max - pvrrc.fb_Y_CLIP.min + 1;
2013-12-19 17:10:14 +00:00
}
else
{
dc_width = 640;
dc_height = 480;
}
}
2013-12-19 17:10:14 +00:00
void SetupMatrices(float dc_width, float dc_height,
float scale_x, float scale_y, float scissoring_scale_x, float scissoring_scale_y,
float &ds2s_offs_x, glm::mat4& normal_mat, glm::mat4& scissor_mat)
{
float screen_scaling = settings.rend.ScreenScaling / 100.f;
if (pvrrc.isRTT)
2013-12-19 17:10:14 +00:00
{
ShaderUniforms.normal_mat = glm::translate(glm::vec3(-1, -1, 0))
* glm::scale(glm::vec3(2.0f / dc_width, 2.0f / dc_height, 1.f));
scissor_mat = ShaderUniforms.normal_mat;
}
else
{
float startx = 0;
float starty = 0;
bool vga = FB_R_CTRL.vclk_div == 1;
switch (SPG_LOAD.hcount)
{
case 857: // NTSC, VGA
startx = VO_STARTX.HStart - (vga ? 0xa8 : 0xa4);
break;
case 863: // PAL
startx = VO_STARTX.HStart - 0xae;
break;
default:
INFO_LOG(PVR, "unknown video mode: hcount %d", SPG_LOAD.hcount);
break;
}
switch (SPG_LOAD.vcount)
{
case 524: // NTSC, VGA
starty = VO_STARTY.VStart_field1 - (vga ? 0x28 : 0x12);
break;
case 262: // NTSC 240p
starty = VO_STARTY.VStart_field1 - 0x11;
break;
case 624: // PAL
starty = VO_STARTY.VStart_field1 - 0x2d;
break;
case 312: // PAL 240p
starty = VO_STARTY.VStart_field1 - 0x2e;
break;
default:
INFO_LOG(PVR, "unknown video mode: vcount %d", SPG_LOAD.vcount);
break;
}
// some heuristic...
startx *= 0.8;
starty *= 1.1;
normal_mat = glm::translate(glm::vec3(startx, starty, 0));
scissor_mat = normal_mat;
float screen_stretching = settings.rend.ScreenStretching / 100.f;
float dc2s_scale_h;
if (settings.rend.Rotate90)
{
dc2s_scale_h = screen_height / 640.0f;
ds2s_offs_x = (screen_width - dc2s_scale_h * 480.0f * screen_stretching) / 2;
float y_coef = 2.0f / (screen_width / dc2s_scale_h * scale_y) * screen_stretching;
float x_coef = -2.0f / dc_width;
glm::mat4 trans_rot = glm::rotate((float)M_PI_2, glm::vec3(0, 0, 1))
* glm::translate(glm::vec3(1, -1 + 2 * ds2s_offs_x / screen_width, 0));
normal_mat = trans_rot
* glm::scale(glm::vec3(x_coef, y_coef, 1.f))
* normal_mat;
scissor_mat = trans_rot
* glm::scale(glm::vec3(x_coef / scissoring_scale_x,
y_coef/ scissoring_scale_y, 1.f))
* scissor_mat; // FIXME scale_x not used, except in dc_width???
}
else
{
dc2s_scale_h = screen_height / 480.0f;
ds2s_offs_x = (screen_width - dc2s_scale_h * 640.0f * screen_stretching) / 2;
float x_coef = 2.0f / (screen_width / dc2s_scale_h * scale_x) * screen_stretching;
float y_coef = -2.0f / dc_height;
normal_mat = glm::translate(glm::vec3(-1 + 2 * ds2s_offs_x / screen_width, 1, 0))
* glm::scale(glm::vec3(x_coef, y_coef, 1.f))
* normal_mat;
scissor_mat = glm::translate(glm::vec3(-1 + 2 * ds2s_offs_x / screen_width, 1, 0))
* glm::scale(glm::vec3(x_coef / scissoring_scale_x,
y_coef / scissoring_scale_y, 1.f))
* scissor_mat;
}
2013-12-19 17:10:14 +00:00
}
normal_mat = glm::scale(glm::vec3(1, 1, 1 / settings.rend.ExtraDepthScale))
* normal_mat;
2013-12-19 17:10:14 +00:00
glm::mat4 vp_trans = glm::translate(glm::vec3(1, 1, 0));
if (pvrrc.isRTT)
{
vp_trans = glm::scale(glm::vec3(dc_width / 2, dc_height / 2, 1.f))
* vp_trans;
}
else
{
vp_trans = glm::scale(glm::vec3(screen_width * screen_scaling / 2, screen_height * screen_scaling / 2, 1.f))
* vp_trans;
}
ViewportMatrix = vp_trans * normal_mat;
scissor_mat = vp_trans * scissor_mat;
}
2013-12-19 17:10:14 +00:00
bool RenderFrame()
{
DoCleanup();
create_modvol_shader();
2013-12-19 17:10:14 +00:00
bool is_rtt = pvrrc.isRTT;
2013-12-19 17:10:14 +00:00
float vtx_min_fZ = 0.f; //pvrrc.fZ_min;
float vtx_max_fZ = pvrrc.fZ_max;
2013-12-19 17:10:14 +00:00
//sanitise the values, now with NaN detection (for omap)
//0x49800000 is 1024*1024. Using integer math to avoid issues w/ infs and nans
if ((s32&)vtx_max_fZ < 0 || (u32&)vtx_max_fZ > 0x49800000)
vtx_max_fZ = 10 * 1024;
2013-12-19 17:10:14 +00:00
//add some extra range to avoid clipping border cases
vtx_min_fZ *= 0.98f;
vtx_max_fZ *= 1.001f;
2013-12-19 17:10:14 +00:00
//calculate a projection so that it matches the pvr x,y setup, and
//a) Z is linearly scaled between 0 ... 1
//b) W is passed though for proper perspective calculations
2013-12-19 17:10:14 +00:00
//these should be adjusted based on the current PVR scaling etc params
float dc_width;
float dc_height;
GetFramebufferSize(dc_width, dc_height);
2013-12-19 17:10:14 +00:00
if (!is_rtt)
gcflip = 0;
else
gcflip = 1;
2013-12-19 17:10:14 +00:00
float scale_x;
float scale_y;
float scissoring_scale_x;
float scissoring_scale_y;
GetFramebufferScaling(scale_x, scale_y, scissoring_scale_x, scissoring_scale_y);
dc_width *= scale_x;
dc_height *= scale_y;
2013-12-19 17:10:14 +00:00
/*
Handle Dc to screen scaling
*/
float screen_scaling = settings.rend.ScreenScaling / 100.f;
2013-12-19 17:10:14 +00:00
float ds2s_offs_x;
2013-12-19 17:10:14 +00:00
glm::mat4 scissor_mat;
SetupMatrices(dc_width, dc_height, scale_x, scale_y, scissoring_scale_x, scissoring_scale_y, ds2s_offs_x, ShaderUniforms.normal_mat, scissor_mat);
2013-12-19 17:10:14 +00:00
ShaderUniforms.depth_coefs[0] = 2 / (vtx_max_fZ - vtx_min_fZ);
ShaderUniforms.depth_coefs[1] = -vtx_min_fZ - 1;
ShaderUniforms.depth_coefs[2] = 0;
ShaderUniforms.depth_coefs[3] = 0;
2013-12-19 17:10:14 +00:00
ShaderUniforms.extra_depth_scale = settings.rend.ExtraDepthScale;
2013-12-19 17:10:14 +00:00
//VERT and RAM fog color constants
u8* fog_colvert_bgra = (u8*)&FOG_COL_VERT;
u8* fog_colram_bgra = (u8*)&FOG_COL_RAM;
ShaderUniforms.ps_FOG_COL_VERT[0] = fog_colvert_bgra[2] / 255.0f;
ShaderUniforms.ps_FOG_COL_VERT[1] = fog_colvert_bgra[1] / 255.0f;
ShaderUniforms.ps_FOG_COL_VERT[2] = fog_colvert_bgra[0] / 255.0f;
2013-12-19 17:10:14 +00:00
ShaderUniforms.ps_FOG_COL_RAM[0] = fog_colram_bgra[2] / 255.0f;
ShaderUniforms.ps_FOG_COL_RAM[1] = fog_colram_bgra[1] / 255.0f;
ShaderUniforms.ps_FOG_COL_RAM[2] = fog_colram_bgra[0] / 255.0f;
2013-12-19 17:10:14 +00:00
//Fog density constant
u8* fog_density = (u8*)&FOG_DENSITY;
float fog_den_mant = fog_density[1] / 128.0f; //bit 7 -> x. bit, so [6:0] -> fraction -> /128
s32 fog_den_exp = (s8)fog_density[0];
ShaderUniforms.fog_den_float = fog_den_mant * powf(2.0f, fog_den_exp);
2013-12-19 17:10:14 +00:00
2018-09-01 10:56:37 +00:00
ShaderUniforms.fog_clamp_min[0] = ((pvrrc.fog_clamp_min >> 16) & 0xFF) / 255.0f;
ShaderUniforms.fog_clamp_min[1] = ((pvrrc.fog_clamp_min >> 8) & 0xFF) / 255.0f;
ShaderUniforms.fog_clamp_min[2] = ((pvrrc.fog_clamp_min >> 0) & 0xFF) / 255.0f;
ShaderUniforms.fog_clamp_min[3] = ((pvrrc.fog_clamp_min >> 24) & 0xFF) / 255.0f;
ShaderUniforms.fog_clamp_max[0] = ((pvrrc.fog_clamp_max >> 16) & 0xFF) / 255.0f;
ShaderUniforms.fog_clamp_max[1] = ((pvrrc.fog_clamp_max >> 8) & 0xFF) / 255.0f;
ShaderUniforms.fog_clamp_max[2] = ((pvrrc.fog_clamp_max >> 0) & 0xFF) / 255.0f;
ShaderUniforms.fog_clamp_max[3] = ((pvrrc.fog_clamp_max >> 24) & 0xFF) / 255.0f;
if (fog_needs_update && settings.rend.Fog)
2013-12-19 17:10:14 +00:00
{
2018-10-28 23:31:24 +00:00
fog_needs_update = false;
UpdateFogTexture((u8 *)FOG_TABLE, GL_TEXTURE1, gl.fog_image_format);
2013-12-19 17:10:14 +00:00
}
glcache.UseProgram(gl.modvol_shader.program);
2013-12-19 17:10:14 +00:00
glUniform4fv( gl.modvol_shader.depth_scale, 1, ShaderUniforms.depth_coefs);
glUniform1f(gl.modvol_shader.extra_depth_scale, ShaderUniforms.extra_depth_scale);
glUniformMatrix4fv(gl.modvol_shader.normal_matrix, 1, GL_FALSE, &ShaderUniforms.normal_mat[0][0]);
2013-12-19 17:10:14 +00:00
ShaderUniforms.PT_ALPHA=(PT_ALPHA_REF&0xFF)/255.0f;
for (auto& it : gl.shaders)
{
glcache.UseProgram(it.second.program);
ShaderUniforms.Set(&it.second);
}
2013-12-19 17:10:14 +00:00
//setup render target first
if (is_rtt)
{
GLuint channels,format;
switch(FB_W_CTRL.fb_packmode)
{
case 0: //0x0 0555 KRGB 16 bit (default) Bit 15 is the value of fb_kval[7].
2013-12-19 17:10:14 +00:00
channels=GL_RGBA;
format=GL_UNSIGNED_BYTE;
2013-12-19 17:10:14 +00:00
break;
case 1: //0x1 565 RGB 16 bit
2013-12-19 17:10:14 +00:00
channels=GL_RGB;
format=GL_UNSIGNED_SHORT_5_6_5;
break;
case 2: //0x2 4444 ARGB 16 bit
2013-12-19 17:10:14 +00:00
channels=GL_RGBA;
format=GL_UNSIGNED_BYTE;
2013-12-19 17:10:14 +00:00
break;
case 3://0x3 1555 ARGB 16 bit The alpha value is determined by comparison with the value of fb_alpha_threshold.
2013-12-19 17:10:14 +00:00
channels=GL_RGBA;
format=GL_UNSIGNED_BYTE;
2013-12-19 17:10:14 +00:00
break;
case 4: //0x4 888 RGB 24 bit packed
case 5: //0x5 0888 KRGB 32 bit K is the value of fk_kval.
case 6: //0x6 8888 ARGB 32 bit
WARN_LOG(RENDERER, "Unsupported render to texture format: %d", FB_W_CTRL.fb_packmode);
return false;
case 7: //7 invalid
2013-12-19 17:10:14 +00:00
die("7 is not valid");
break;
}
DEBUG_LOG(RENDERER, "RTT packmode=%d stride=%d - %d,%d -> %d,%d", FB_W_CTRL.fb_packmode, FB_W_LINESTRIDE.stride * 8,
FB_X_CLIP.min, FB_Y_CLIP.min, FB_X_CLIP.max, FB_Y_CLIP.max);
BindRTT(FB_W_SOF1 & VRAM_MASK, dc_width, dc_height, channels, format);
2013-12-19 17:10:14 +00:00
}
else
{
if (settings.rend.ScreenScaling != 100 || !theGLContext.IsSwapBufferPreserved())
2019-02-18 23:49:24 +00:00
{
2019-08-17 15:19:33 +00:00
init_output_framebuffer((int)lroundf(screen_width * screen_scaling), (int)lroundf(screen_height * screen_scaling));
}
2019-02-18 23:49:24 +00:00
else
{
#if HOST_OS != OS_DARWIN
2019-02-18 23:49:24 +00:00
//Fix this in a proper way
glBindFramebuffer(GL_FRAMEBUFFER,0);
#endif
glViewport(0, 0, screen_width, screen_height);
}
2013-12-19 17:10:14 +00:00
}
bool wide_screen_on = !is_rtt && settings.rend.WideScreen
&& pvrrc.fb_X_CLIP.min == 0
2019-08-17 15:19:33 +00:00
&& lroundf((pvrrc.fb_X_CLIP.max + 1) / scale_x) == 640L
&& pvrrc.fb_Y_CLIP.min == 0
2019-08-17 15:19:33 +00:00
&& lroundf((pvrrc.fb_Y_CLIP.max + 1) / scale_y) == 480L;
2013-12-19 17:10:14 +00:00
//Color is cleared by the background plane
2013-12-19 17:10:14 +00:00
glcache.Disable(GL_SCISSOR_TEST);
2013-12-19 17:10:14 +00:00
glcache.DepthMask(GL_TRUE);
glClearDepthf(0.0);
glStencilMask(0xFF); glCheck();
glClearStencil(0);
glClear(GL_STENCIL_BUFFER_BIT | GL_DEPTH_BUFFER_BIT); glCheck();
2013-12-19 17:10:14 +00:00
//move vertex to gpu
2018-08-26 14:58:10 +00:00
if (!pvrrc.isRenderFramebuffer)
2013-12-19 17:10:14 +00:00
{
2018-08-26 14:58:10 +00:00
//Main VBO
glBindBuffer(GL_ARRAY_BUFFER, gl.vbo.geometry); glCheck();
glBindBuffer(GL_ELEMENT_ARRAY_BUFFER, gl.vbo.idxs); glCheck();
2013-12-19 17:10:14 +00:00
2018-08-26 14:58:10 +00:00
glBufferData(GL_ARRAY_BUFFER,pvrrc.verts.bytes(),pvrrc.verts.head(),GL_STREAM_DRAW); glCheck();
2015-05-08 15:44:27 +00:00
upload_vertex_indices();
2015-05-08 15:44:27 +00:00
2018-08-26 14:58:10 +00:00
//Modvol VBO
if (pvrrc.modtrig.used())
2019-02-09 22:59:16 +00:00
{
2018-08-26 14:58:10 +00:00
glBindBuffer(GL_ARRAY_BUFFER, gl.vbo.modvols); glCheck();
glBufferData(GL_ARRAY_BUFFER,pvrrc.modtrig.bytes(),pvrrc.modtrig.head(),GL_STREAM_DRAW); glCheck();
2019-02-09 22:59:16 +00:00
}
2013-12-19 17:10:14 +00:00
2018-08-26 14:58:10 +00:00
if (!wide_screen_on)
2019-02-09 22:59:16 +00:00
{
float width;
float height;
float min_x;
float min_y;
2018-08-26 14:58:10 +00:00
if (!is_rtt)
{
glm::vec4 clip_min(pvrrc.fb_X_CLIP.min, pvrrc.fb_Y_CLIP.min, 0, 1);
glm::vec4 clip_dim(pvrrc.fb_X_CLIP.max - pvrrc.fb_X_CLIP.min + 1,
pvrrc.fb_Y_CLIP.max - pvrrc.fb_Y_CLIP.min + 1, 0, 0);
clip_min = scissor_mat * clip_min;
clip_dim = scissor_mat * clip_dim;
min_x = clip_min[0];
min_y = clip_min[1];
width = clip_dim[0];
height = clip_dim[1];
if (width < 0)
{
min_x += width;
width = -width;
}
if (height < 0)
{
min_y += height;
height = -height;
}
if (ds2s_offs_x > 0)
{
float scaled_offs_x = ds2s_offs_x * screen_scaling;
2018-10-05 13:07:30 +00:00
glcache.ClearColor(0.f, 0.f, 0.f, 0.f);
glcache.Enable(GL_SCISSOR_TEST);
2019-08-17 15:19:33 +00:00
glScissor(0, 0, (GLsizei)lroundf(scaled_offs_x), (GLsizei)lroundf(screen_height * screen_scaling));
glClear(GL_COLOR_BUFFER_BIT);
glScissor(screen_width * screen_scaling - scaled_offs_x, 0, (GLsizei)lroundf(scaled_offs_x + 1.f), (GLsizei)lroundf(screen_height * screen_scaling));
glClear(GL_COLOR_BUFFER_BIT);
}
2018-08-26 14:58:10 +00:00
}
else
2018-08-26 14:58:10 +00:00
{
width = pvrrc.fb_X_CLIP.max - pvrrc.fb_X_CLIP.min + 1;
height = pvrrc.fb_Y_CLIP.max - pvrrc.fb_Y_CLIP.min + 1;
min_x = pvrrc.fb_X_CLIP.min;
min_y = pvrrc.fb_Y_CLIP.min;
if (settings.rend.RenderToTextureUpscale > 1 && !settings.rend.RenderToTextureBuffer)
{
min_x *= settings.rend.RenderToTextureUpscale;
min_y *= settings.rend.RenderToTextureUpscale;
width *= settings.rend.RenderToTextureUpscale;
height *= settings.rend.RenderToTextureUpscale;
}
2018-08-26 14:58:10 +00:00
}
2019-08-17 15:19:33 +00:00
glScissor((GLint)lroundf(min_x), (GLint)lroundf(min_y), (GLsizei)lroundf(width), (GLsizei)lroundf(height));
2018-08-26 14:58:10 +00:00
glcache.Enable(GL_SCISSOR_TEST);
}
2013-12-19 17:10:14 +00:00
DrawStrips();
}
2018-08-26 14:58:10 +00:00
else
{
glcache.ClearColor(0.f, 0.f, 0.f, 0.f);
glClear(GL_COLOR_BUFFER_BIT);
DrawFramebuffer();
2018-08-26 14:58:10 +00:00
}
#ifdef _WIN32
2013-12-19 17:10:14 +00:00
//Sleep(40); //to test MT stability
#endif
eglCheck();
2018-05-08 16:47:00 +00:00
if (is_rtt)
ReadRTTBuffer();
else if (settings.rend.ScreenScaling != 100 || !theGLContext.IsSwapBufferPreserved())
2019-02-18 23:49:24 +00:00
render_output_framebuffer();
2013-12-19 17:10:14 +00:00
return !is_rtt;
}
void rend_set_fb_scale(float x, float y)
2013-12-19 17:10:14 +00:00
{
fb_scale_x = x;
fb_scale_y = y;
2013-12-19 17:10:14 +00:00
}
struct glesrend : Renderer
{
bool Init() override { return gles_init(); }
void Resize(int w, int h) override { screen_width=w; screen_height=h; }
void Term() override
2018-10-29 17:02:47 +00:00
{
TexCache.Clear();
gles_term();
2018-10-29 17:02:47 +00:00
}
2013-12-19 17:10:14 +00:00
bool Process(TA_context* ctx) override { return ProcessFrame(ctx); }
bool Render() override
{
RenderFrame();
if (!pvrrc.isRTT)
DrawOSD(false);
return !pvrrc.isRTT;
}
bool RenderLastFrame() override { return !theGLContext.IsSwapBufferPreserved() ? render_output_framebuffer() : false; }
void Present() override { theGLContext.Swap(); glViewport(0, 0, screen_width, screen_height); }
void DrawOSD(bool clear_screen) override
{
OSD_DRAW(clear_screen);
}
virtual u64 GetTexture(TSP tsp, TCW tcw) override
{
return gl_GetTexture(tsp, tcw);
}
2013-12-19 17:10:14 +00:00
};
GLuint loadPNG(const string& fname, int &width, int &height)
2018-12-30 17:42:55 +00:00
{
png_byte *image_data = loadPNGData(fname, width, height);
if (image_data == NULL)
return TEXTURE_LOAD_ERROR;
2013-12-19 17:10:14 +00:00
//Now generate the OpenGL texture object
GLuint texture = glcache.GenTexture();
glcache.BindTexture(GL_TEXTURE_2D, texture);
2013-12-19 17:10:14 +00:00
glTexImage2D(GL_TEXTURE_2D, 0, GL_RGBA, width, height, 0, GL_RGBA,
GL_UNSIGNED_BYTE, (GLvoid*) image_data);
glcache.TexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_LINEAR);
2013-12-19 17:10:14 +00:00
delete[] image_data;
return texture;
}
Renderer* rend_GLES2() { return new glesrend(); }