fix shadow bugs

bahaahah
This commit is contained in:
Arisotura 2019-05-25 01:55:44 +02:00
parent 8a63c76f4f
commit 182e123598
2 changed files with 166 additions and 148 deletions

View File

@ -45,6 +45,7 @@ enum
GLuint ClearShaderPlain[3]; GLuint ClearShaderPlain[3];
GLuint RenderShader[16][3]; GLuint RenderShader[16][3];
GLuint CurShaderID = -1;
struct struct
{ {
@ -61,6 +62,7 @@ typedef struct
{ {
Polygon* PolyData; Polygon* PolyData;
u32 NumIndices;
u16* Indices; u16* Indices;
u32 RenderKey; u32 RenderKey;
@ -158,7 +160,9 @@ bool BuildRenderShader(u32 flags, const char* vs, const char* fs)
void UseRenderShader(u32 flags) void UseRenderShader(u32 flags)
{ {
if (CurShaderID == flags) return;
glUseProgram(RenderShader[flags][2]); glUseProgram(RenderShader[flags][2]);
CurShaderID = flags;
} }
void SetupDefaultTexParams(GLuint tex) void SetupDefaultTexParams(GLuint tex)
@ -311,10 +315,7 @@ bool Init()
glBindFramebuffer(GL_FRAMEBUFFER, FramebufferID[0]); glBindFramebuffer(GL_FRAMEBUFFER, FramebufferID[0]);
glEnable(GL_BLEND); glEnable(GL_BLEND);
// TODO: these are said to require GL 4.0; use the regular ones instead? glBlendEquationSeparate(GL_FUNC_ADD, GL_MAX);
glBlendFuncSeparatei(0, GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA, GL_ONE, GL_ONE);
glBlendEquationSeparatei(0, GL_FUNC_ADD, GL_MAX);
glBlendFuncSeparatei(1, GL_ONE, GL_ZERO, GL_ONE, GL_ZERO);
glGenBuffers(1, &PixelbufferID); glGenBuffers(1, &PixelbufferID);
@ -335,7 +336,7 @@ bool Init()
glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_NEAREST); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_NEAREST);
glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_NEAREST); glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_NEAREST);
glTexImage2D(GL_TEXTURE_2D, 0, GL_RGB5_A1, 1024, 48, 0, GL_RGBA, GL_UNSIGNED_SHORT_1_5_5_5_REV, NULL); glTexImage2D(GL_TEXTURE_2D, 0, GL_RGB5_A1, 1024, 48, 0, GL_RGBA, GL_UNSIGNED_SHORT_1_5_5_5_REV, NULL);
printf("init done. %04X\n", glGetError());
return true; return true;
} }
@ -486,6 +487,8 @@ void BuildPolygons(RendererPolygon* polygons, int npolys)
if (poly->FacingView) vtxattr |= (1<<8); if (poly->FacingView) vtxattr |= (1<<8);
if (poly->WBuffer) vtxattr |= (1<<9); if (poly->WBuffer) vtxattr |= (1<<9);
rp->NumIndices = 0;
// assemble vertices // assemble vertices
for (int j = 0; j < poly->NumVertices; j++) for (int j = 0; j < poly->NumVertices; j++)
{ {
@ -531,6 +534,7 @@ void BuildPolygons(RendererPolygon* polygons, int npolys)
*iptr++ = vidx - 1; *iptr++ = vidx - 1;
*iptr++ = vidx; *iptr++ = vidx;
numtriangles++; numtriangles++;
rp->NumIndices += 3;
} }
vidx++; vidx++;
@ -541,14 +545,38 @@ void BuildPolygons(RendererPolygon* polygons, int npolys)
NumVertices = vidx; NumVertices = vidx;
} }
void RenderSinglePolygon(int i)
{
RendererPolygon* rp = &PolygonList[i];
glDrawElements(GL_TRIANGLES, rp->NumIndices, GL_UNSIGNED_SHORT, rp->Indices);
}
int RenderPolygonBatch(int i)
{
RendererPolygon* rp = &PolygonList[i];
u32 key = rp->RenderKey;
int numpolys = 0;
u32 numindices = 0;
for (int iend = i; iend < NumFinalPolys; iend++)
{
RendererPolygon* cur_rp = &PolygonList[iend];
if (cur_rp->RenderKey != key) break;
numpolys++;
numindices += cur_rp->NumIndices;
}
glDrawElements(GL_TRIANGLES, numindices, GL_UNSIGNED_SHORT, rp->Indices);
return numpolys;
}
void RenderSceneChunk(int y, int h) void RenderSceneChunk(int y, int h)
{ {
u32 flags = 0; u32 flags = 0;
if (RenderPolygonRAM[0]->WBuffer) flags |= RenderFlag_WBuffer; if (RenderPolygonRAM[0]->WBuffer) flags |= RenderFlag_WBuffer;
u16* iptr;
u32 curkey;
if (h != 192) glScissor(0, y<<ScaleFactor, 256<<ScaleFactor, h<<ScaleFactor); if (h != 192) glScissor(0, y<<ScaleFactor, 256<<ScaleFactor, h<<ScaleFactor);
// pass 1: opaque pixels // pass 1: opaque pixels
@ -562,20 +590,9 @@ void RenderSceneChunk(int y, int h)
glBindVertexArray(VertexArrayID); glBindVertexArray(VertexArrayID);
iptr = PolygonList[0].Indices; for (int i = 0; i < NumFinalPolys; )
curkey = 0xFFFFFFFF;
for (int i = 0; i < NumFinalPolys; i++)
{ {
RendererPolygon* rp = &PolygonList[i]; RendererPolygon* rp = &PolygonList[i];
if (rp->RenderKey != curkey)
{
u16* endptr = rp->Indices;
u32 num = (u32)(endptr - iptr);
if (num) glDrawElements(GL_TRIANGLES, num, GL_UNSIGNED_SHORT, iptr);
iptr = rp->Indices;
curkey = rp->RenderKey;
// zorp // zorp
glDepthFunc(GL_LESS); glDepthFunc(GL_LESS);
@ -586,13 +603,8 @@ void RenderSceneChunk(int y, int h)
glStencilFunc(GL_ALWAYS, polyid, 0xFF); glStencilFunc(GL_ALWAYS, polyid, 0xFF);
glStencilOp(GL_KEEP, GL_KEEP, GL_REPLACE); glStencilOp(GL_KEEP, GL_KEEP, GL_REPLACE);
glStencilMask(0xFF); glStencilMask(0xFF);
}
}
{ i += RenderPolygonBatch(i);
u16* endptr = &IndexBuffer[NumTriangles*3];
u32 num = (u32)(endptr - iptr);
if (num) glDrawElements(GL_TRIANGLES, num, GL_UNSIGNED_SHORT, iptr);
} }
glEnable(GL_BLEND); glEnable(GL_BLEND);
@ -602,54 +614,81 @@ void RenderSceneChunk(int y, int h)
{ {
glColorMaski(1, GL_FALSE, GL_FALSE, GL_FALSE, GL_FALSE); glColorMaski(1, GL_FALSE, GL_FALSE, GL_FALSE, GL_FALSE);
if (PolygonList[NumOpaqueFinalPolys].PolyData->IsShadow) printf("!! GLORG!!! %08X\n", PolygonList[NumOpaqueFinalPolys].PolyData->Attr);
// pass 2: if needed, render translucent pixels that are against background pixels // pass 2: if needed, render translucent pixels that are against background pixels
// when background alpha is zero, those need to be rendered with blending disabled // when background alpha is zero, those need to be rendered with blending disabled
if ((RenderClearAttr1 & 0x001F0000) == 0) if ((RenderClearAttr1 & 0x001F0000) == 0)
{ {
iptr = PolygonList[NumOpaqueFinalPolys].Indices;
curkey = 0xFFFFFFFF;
glDisable(GL_BLEND); glDisable(GL_BLEND);
for (int i = NumOpaqueFinalPolys; i < NumFinalPolys; i++) for (int i = 0; i < NumFinalPolys; )
{ {
RendererPolygon* rp = &PolygonList[i]; RendererPolygon* rp = &PolygonList[i];
if (rp->RenderKey != curkey)
if (rp->PolyData->IsShadowMask)
{ {
u16* endptr = rp->Indices; // clear shadow bits in stencil buffer
u32 num = (u32)(endptr - iptr);
if (num) glDrawElements(GL_TRIANGLES, num, GL_UNSIGNED_SHORT, iptr);
iptr = rp->Indices; glStencilMask(0x80);
curkey = rp->RenderKey; glClear(GL_STENCIL_BUFFER_BIT);
// configure new one // draw actual shadow mask
// shadows aren't likely to pass against the clear-plane, so UseRenderShader(flags | RenderFlag_ShadowMask);
if (rp->PolyData->IsShadow) continue;
glDisable(GL_BLEND);
glColorMaski(0, GL_FALSE, GL_FALSE, GL_FALSE, GL_FALSE);
glColorMaski(1, GL_FALSE, GL_FALSE, GL_FALSE, GL_FALSE);
glDepthMask(GL_FALSE);
glDepthFunc(GL_LESS);
glStencilFunc(GL_EQUAL, 0xFF, 0xFE);
glStencilOp(GL_KEEP, GL_INVERT, GL_KEEP);
glStencilMask(0x01);
i += RenderPolygonBatch(i);
}
else if (rp->PolyData->Translucent)
{
// zorp // zorp
glDepthFunc(GL_LESS); glDepthFunc(GL_LESS);
u32 polyattr = rp->PolyData->Attr; u32 polyattr = rp->PolyData->Attr;
u32 polyid = (polyattr >> 24) & 0x3F; u32 polyid = (polyattr >> 24) & 0x3F;
glStencilFunc(GL_EQUAL, 0xFF, 0xFF); if (rp->PolyData->IsShadow)
{
// shadow against clear-plane will only pass if its polyID matches that of the clear plane
u32 clrpolyid = (RenderClearAttr1 >> 24) & 0x3F;
if (polyid != clrpolyid) { i++; continue; }
glEnable(GL_BLEND);
glColorMaski(0, GL_TRUE, GL_TRUE, GL_TRUE, GL_TRUE);
glColorMaski(1, GL_FALSE, GL_TRUE, GL_FALSE, GL_FALSE);
glStencilFunc(GL_EQUAL, 0xFE, 0xFF);
glStencilOp(GL_KEEP, GL_KEEP, GL_INVERT); glStencilOp(GL_KEEP, GL_KEEP, GL_INVERT);
glStencilMask(~(0x40|polyid)); // heheh glStencilMask(~(0x40|polyid)); // heheh
if (polyattr & (1<<11)) glDepthMask(GL_TRUE); if (polyattr & (1<<11)) glDepthMask(GL_TRUE);
else glDepthMask(GL_FALSE); else glDepthMask(GL_FALSE);
}
}
i += RenderPolygonBatch(i);
}
else
{ {
u16* endptr = &IndexBuffer[NumTriangles*3]; glStencilFunc(GL_EQUAL, 0xFF, 0xFE);
u32 num = (u32)(endptr - iptr); glStencilOp(GL_KEEP, GL_KEEP, GL_INVERT);
if (num) glDrawElements(GL_TRIANGLES, num, GL_UNSIGNED_SHORT, iptr); glStencilMask(~(0x40|polyid)); // heheh
if (polyattr & (1<<11)) glDepthMask(GL_TRUE);
else glDepthMask(GL_FALSE);
i += RenderPolygonBatch(i);
}
}
else
i++;
} }
glEnable(GL_BLEND); glEnable(GL_BLEND);
@ -658,22 +697,9 @@ void RenderSceneChunk(int y, int h)
// pass 3: translucent pixels // pass 3: translucent pixels
iptr = PolygonList[NumOpaqueFinalPolys].Indices; for (int i = 0; i < NumFinalPolys; )
curkey = 0xFFFFFFFF;
for (int i = NumOpaqueFinalPolys; i < NumFinalPolys; i++)
{ {
RendererPolygon* rp = &PolygonList[i]; RendererPolygon* rp = &PolygonList[i];
if (rp->RenderKey != curkey)
{
u16* endptr = rp->Indices;
u32 num = (u32)(endptr - iptr);
if (num) glDrawElements(GL_TRIANGLES, num, GL_UNSIGNED_SHORT, iptr);
iptr = rp->Indices;
curkey = rp->RenderKey;
// configure new one
if (rp->PolyData->IsShadowMask) if (rp->PolyData->IsShadowMask)
{ {
@ -695,10 +721,9 @@ void RenderSceneChunk(int y, int h)
glStencilFunc(GL_ALWAYS, 0x80, 0x80); glStencilFunc(GL_ALWAYS, 0x80, 0x80);
glStencilOp(GL_KEEP, GL_REPLACE, GL_KEEP); glStencilOp(GL_KEEP, GL_REPLACE, GL_KEEP);
glBindBuffer(GL_ARRAY_BUFFER, VertexBufferID); i += RenderPolygonBatch(i);
glBindVertexArray(VertexArrayID);
} }
else else if (rp->PolyData->Translucent)
{ {
UseRenderShader(flags | RenderFlag_Trans); UseRenderShader(flags | RenderFlag_Trans);
@ -718,22 +743,7 @@ void RenderSceneChunk(int y, int h)
glStencilOp(GL_KEEP, GL_KEEP, GL_ZERO); glStencilOp(GL_KEEP, GL_KEEP, GL_ZERO);
glStencilMask(0x80); glStencilMask(0x80);
{ RenderSinglePolygon(i);
u16* _endptr = &IndexBuffer[NumTriangles*3];
for (int j = i; j < NumFinalPolys; j++)
{
RendererPolygon* rp = &PolygonList[j];
if (!rp->PolyData->IsShadow)
{
_endptr = rp->Indices;
break;
}
// berg.
}
u32 num = (u32)(_endptr - iptr);
if (num) glDrawElements(GL_TRIANGLES, num, GL_UNSIGNED_SHORT, iptr);
}
glEnable(GL_BLEND); glEnable(GL_BLEND);
glColorMaski(0, GL_TRUE, GL_TRUE, GL_TRUE, GL_TRUE); glColorMaski(0, GL_TRUE, GL_TRUE, GL_TRUE, GL_TRUE);
@ -742,6 +752,12 @@ void RenderSceneChunk(int y, int h)
glStencilFunc(GL_EQUAL, 0xC0|polyid, 0x80); glStencilFunc(GL_EQUAL, 0xC0|polyid, 0x80);
glStencilOp(GL_KEEP, GL_KEEP, GL_REPLACE); glStencilOp(GL_KEEP, GL_KEEP, GL_REPLACE);
glStencilMask(0x7F); glStencilMask(0x7F);
if (polyattr & (1<<11)) glDepthMask(GL_TRUE);
else glDepthMask(GL_FALSE);
RenderSinglePolygon(i);
i++;
} }
else else
{ {
@ -752,18 +768,15 @@ void RenderSceneChunk(int y, int h)
glStencilFunc(GL_NOTEQUAL, 0x40|polyid, 0x7F); glStencilFunc(GL_NOTEQUAL, 0x40|polyid, 0x7F);
glStencilOp(GL_KEEP, GL_KEEP, GL_REPLACE); glStencilOp(GL_KEEP, GL_KEEP, GL_REPLACE);
glStencilMask(0x7F); glStencilMask(0x7F);
}
if (polyattr & (1<<11)) glDepthMask(GL_TRUE); if (polyattr & (1<<11)) glDepthMask(GL_TRUE);
else glDepthMask(GL_FALSE); else glDepthMask(GL_FALSE);
}
}
}
{ i += RenderPolygonBatch(i);
u16* endptr = &IndexBuffer[NumTriangles*3]; }
u32 num = (u32)(endptr - iptr); }
if (num) glDrawElements(GL_TRIANGLES, num, GL_UNSIGNED_SHORT, iptr); else
i++;
} }
} }
@ -835,9 +848,14 @@ void RenderFrame()
if (Antialias) glBindFramebuffer(GL_FRAMEBUFFER, FramebufferID[2]); if (Antialias) glBindFramebuffer(GL_FRAMEBUFFER, FramebufferID[2]);
else glBindFramebuffer(GL_FRAMEBUFFER, FramebufferID[FrontBuffer]); else glBindFramebuffer(GL_FRAMEBUFFER, FramebufferID[FrontBuffer]);
if (RenderDispCnt & (1<<3))
glBlendFuncSeparate(GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA, GL_ONE, GL_ONE);
else
glBlendFuncSeparate(GL_ONE, GL_ZERO, GL_ONE, GL_ONE);
glDisable(GL_BLEND); glDisable(GL_BLEND);
glColorMaski(0, GL_TRUE, GL_TRUE, GL_TRUE, GL_TRUE); glColorMaski(0, GL_TRUE, GL_TRUE, GL_TRUE, GL_TRUE);
glColorMaski(1, GL_TRUE, GL_TRUE, GL_TRUE, GL_FALSE); glColorMaski(1, GL_TRUE, GL_TRUE, GL_TRUE, GL_TRUE);
glDepthMask(GL_TRUE); glDepthMask(GL_TRUE);
glStencilMask(0xFF); glStencilMask(0xFF);

View File

@ -100,8 +100,8 @@
\ \
func(GLDRAWBUFFERS, glDrawBuffers); \ func(GLDRAWBUFFERS, glDrawBuffers); \
\ \
func(GLBLENDFUNCSEPARATEI, glBlendFuncSeparatei); \ func(GLBLENDFUNCSEPARATE, glBlendFuncSeparate); \
func(GLBLENDEQUATIONSEPARATEI, glBlendEquationSeparatei); \ func(GLBLENDEQUATIONSEPARATE, glBlendEquationSeparate); \
\ \
func(GLCOLORMASKI, glColorMaski); \ func(GLCOLORMASKI, glColorMaski); \
\ \