rasterize: unexpected necessity: render any convex polygon without triangulating (more complex polygons can be created by culling)

This commit is contained in:
zeromus 2009-02-27 08:53:03 +00:00
parent 51ed1af70f
commit 3fc3cb346f
1 changed files with 90 additions and 143 deletions

View File

@ -26,6 +26,10 @@
//the shape rasterizers contained herein are based on code supplied by Chris Hecker from //the shape rasterizers contained herein are based on code supplied by Chris Hecker from
//http://chrishecker.com/Miscellaneous_Technical_Articles //http://chrishecker.com/Miscellaneous_Technical_Articles
//The worst case we've managed to think of so far would be a viewport zoomed in a little bit
//on a diamond, with cut-out bits in all four corners
#define MAX_CLIPPED_VERTS 8
#include "rasterize.h" #include "rasterize.h"
#include <algorithm> #include <algorithm>
@ -166,11 +170,12 @@ struct Fragment
u8 pad[5]; u8 pad[5];
}; };
static VERT* verts[4]; static VERT* verts[MAX_CLIPPED_VERTS];
static VERT* sortedVerts[MAX_CLIPPED_VERTS];
INLINE static void SubmitVertex(int vert_index, VERT* rawvert) INLINE static void SubmitVertex(int vert_index, VERT& rawvert)
{ {
verts[vert_index] = rawvert; verts[vert_index] = &rawvert;
} }
static Fragment screen[256*192]; static Fragment screen[256*192];
@ -349,42 +354,6 @@ struct Shader
} shader; } shader;
struct Interpolator
{
float dx, dy;
float Z, pZ;
struct {
float x,y,z;
} point0;
Interpolator(float x1, float x2, float x3, float y1, float y2, float y3, float z1, float z2, float z3)
{
float A = (z3 - z1) * (y2 - y1) - (z2 - z1) * (y3 - y1);
float B = (x3 - x1) * (z2 - z1) - (x2 - x1) * (z3 - z1);
float C = (x2 - x1) * (y3 - y1) - (x3 - x1) * (y2 - y1);
dx = -(float)A / C;
dy = -(float)B / C;
point0.x = x1;
point0.y = y1;
point0.z = z1;
}
void init(int x, int y)
{
Z = point0.z + dx * (x-point0.x) + dy * (y-point0.y);
}
FORCEINLINE int cur() { return iround(Z); }
FORCEINLINE void push() { pZ = Z; }
FORCEINLINE void pop() { Z = pZ; }
FORCEINLINE void incy() { Z += dy; }
FORCEINLINE void incx() { Z += dx; }
FORCEINLINE void incx(int count) { Z += dx*count; }
};
static void alphaBlend(Fragment::Color & dst, const Fragment::Color & src) static void alphaBlend(Fragment::Color & dst, const Fragment::Color & src)
{ {
if(gfx3d.enableAlphaBlending) if(gfx3d.enableAlphaBlending)
@ -566,7 +535,7 @@ typedef int fixed28_4;
static bool failure; static bool failure;
// handle floor divides and mods correctly // handle floor divides and mods correctly
inline void FloorDivMod( long Numerator, long Denominator, long &Floor, long &Mod ) inline void FloorDivMod(long Numerator, long Denominator, long &Floor, long &Mod)
{ {
//These must be caused by invalid or degenerate shapes.. not sure yet. //These must be caused by invalid or degenerate shapes.. not sure yet.
//check it out in the mario face intro of SM64 //check it out in the mario face intro of SM64
@ -628,8 +597,8 @@ inline long Ceil28_4( fixed28_4 Value ) {
struct edge_fx_fl { struct edge_fx_fl {
edge_fx_fl() {} edge_fx_fl() {}
edge_fx_fl(VERT **pVertices, int Top, int Bottom ); edge_fx_fl(int Top, int Bottom);
inline int Step( void ); inline int Step();
long X, XStep, Numerator, Denominator; // DDA info for x long X, XStep, Numerator, Denominator; // DDA info for x
long ErrorTerm; long ErrorTerm;
@ -659,8 +628,7 @@ struct edge_fx_fl {
void doStepExtraInterpolants() { for(int i=0;i<NUM_INTERPOLANTS;i++) interpolants[i].doStepExtra(); } void doStepExtraInterpolants() { for(int i=0;i<NUM_INTERPOLANTS;i++) interpolants[i].doStepExtra(); }
}; };
edge_fx_fl::edge_fx_fl( VERT **verts, int Top, int Bottom ) edge_fx_fl::edge_fx_fl(int Top, int Bottom) {
{
Y = Ceil28_4(verts[Top]->y); Y = Ceil28_4(verts[Top]->y);
int YEnd = Ceil28_4(verts[Bottom]->y); int YEnd = Ceil28_4(verts[Bottom]->y);
Height = YEnd - Y; Height = YEnd - Y;
@ -690,7 +658,7 @@ edge_fx_fl::edge_fx_fl( VERT **verts, int Top, int Bottom )
} }
} }
inline int edge_fx_fl::Step( void ) { inline int edge_fx_fl::Step() {
X += XStep; Y++; Height--; X += XStep; Y++; Height--;
doStepInterpolants(); doStepInterpolants();
@ -703,8 +671,8 @@ inline int edge_fx_fl::Step( void ) {
return Height; return Height;
} }
//draws a single scanline
void hecker_DrawScanLine(edge_fx_fl *pLeft, edge_fx_fl *pRight) static void drawscanline(edge_fx_fl *pLeft, edge_fx_fl *pRight)
{ {
int XStart = pLeft->X; int XStart = pLeft->X;
int width = pRight->X - XStart; int width = pRight->X - XStart;
@ -747,60 +715,93 @@ void hecker_DrawScanLine(edge_fx_fl *pLeft, edge_fx_fl *pRight)
} }
} }
static void runscanline(edge_fx_fl *left, edge_fx_fl *right) //runs several scanlines, until an edge is finished
static void runscanlines(edge_fx_fl *left, edge_fx_fl *right)
{ {
//do not overstep either of the edges //do not overstep either of the edges
int Height = min(left->Height,right->Height); int Height = min(left->Height,right->Height);
while(Height--) { while(Height--) {
hecker_DrawScanLine(left,right); drawscanline(left,right);
left->Step(); left->Step();
right->Step(); right->Step();
} }
} }
//This function can handle a quad or a triangle. A triangle is just a quad with a duped vert. //rotates verts counterclockwise
template<int type>
inline static void rot_verts() {
#define ROTSWAP(X) if(type>X) swap(verts[X-1],verts[X]);
ROTSWAP(1); ROTSWAP(2); ROTSWAP(3); ROTSWAP(4);
ROTSWAP(5); ROTSWAP(6); ROTSWAP(7);
}
//rotate verts until vert0.y is minimum, and then vert0.x is minimum in case of ties
//this is a necessary precondition for our shape engine
template<int type>
static void sort_verts(bool backwards) {
//if the verts are backwards, reorder them first
if(backwards)
for(int i=0;i<type/2;i++)
swap(verts[i],verts[type-i-1]);
for(;;)
{
//this was the only way we could get this to unroll
#define CHECKY(X) if(type>X) if(verts[0]->y > verts[X]->y) goto doswap;
CHECKY(1); CHECKY(2); CHECKY(3); CHECKY(4);
CHECKY(5); CHECKY(6); CHECKY(7);
break;
doswap:
rot_verts<type>();
}
while(verts[0]->y == verts[1]->y && verts[0]->x > verts[1]->x)
rot_verts<type>();
}
//This function can handle any convex N-gon up to octagons
//verts must be clockwise. //verts must be clockwise.
//The algorithm used here is of my own devising... as far as I know. //I didnt reference anything for this algorithm but it seems like I've seen it somewhere before.
static void shape_engine() static void shape_engine(int type, bool backwards)
{ {
failure = false; failure = false;
VERT* v[4] = {verts[0],verts[1],verts[2],verts[3]}; switch(type) {
case 3: sort_verts<3>(backwards); break;
//rotate verts until vert0.y is minimum, and then vert0.x is minimum in case of ties case 4: sort_verts<4>(backwards); break;
//this will reduce the complexity of our logic case 5: sort_verts<5>(backwards); break;
while(v[0]->y > v[1]->y || v[0]->y > v[2]->y || v[0]->y > v[3]->y) { case 6: sort_verts<6>(backwards); break;
swap(v[0],v[1]); case 7: sort_verts<7>(backwards); break;
swap(v[1],v[2]); case 8: sort_verts<8>(backwards); break;
swap(v[2],v[3]); default: printf("skipping type %d\n",type); return;
} }
while(v[0]->y == v[1]->y && v[0]->x > v[1]->x) {
swap(v[0],v[1]);
swap(v[1],v[2]);
swap(v[2],v[3]);
}
//we are going to step around the polygon in both directions starting from vert 0. //we are going to step around the polygon in both directions starting from vert 0.
//right edges will be stepped over clockwise and left edges stepped over counterclockwise. //right edges will be stepped over clockwise and left edges stepped over counterclockwise.
//these variables track that stepping, but in order to facilitate wrapping we start extra high //these variables track that stepping, but in order to facilitate wrapping we start extra high
//for the counter we're decrementing. //for the counter we're decrementing.
int lv = 4, rv = 0; int lv = type, rv = 0;
edge_fx_fl left, right; edge_fx_fl left, right;
bool step_left = true, step_right = true; bool step_left = true, step_right = true;
for(;;) { for(;;) {
//generate new edges if necessary. we must avoid regenerating edges when they are incomplete //generate new edges if necessary. we must avoid regenerating edges when they are incomplete
//so that they can be continued on down the shape //so that they can be continued on down the shape
if(step_left) left = edge_fx_fl(v,lv&3,lv-1); assert(rv != type);
if(step_right) right = edge_fx_fl(v,rv&3,rv+1); int _lv = lv==type?0:lv; //make sure that we ask for vert 0 when the variable contains the starting value
if(step_left) left = edge_fx_fl(_lv,lv-1);
if(step_right) right = edge_fx_fl(rv,rv+1);
step_left = step_right = false; step_left = step_right = false;
//handle a failure in the edge setup. //handle a failure in the edge setup due to nutty polys
if(failure) if(failure)
return; return;
runscanline(&left,&right); runscanlines(&left,&right);
//if we ran out of an edge, step to the next one
if(right.Height == 0) { if(right.Height == 0) {
step_right = true; step_right = true;
rv++; rv++;
@ -893,7 +894,7 @@ static struct TClippedPoly
{ {
int type; int type;
POLY* poly; POLY* poly;
VERT clipVerts[16]; //how many? i cant imagine having more than 6 VERT clipVerts[MAX_CLIPPED_VERTS];
} clippedPolys[POLYLIST_SIZE*2]; } clippedPolys[POLYLIST_SIZE*2];
static int clippedPolyCounter; static int clippedPolyCounter;
@ -1035,33 +1036,22 @@ static void clipPoly(POLY* poly)
clipPolyVsPlane(1, 1); clipPolyVsPlane(1, 1);
clipPolyVsPlane(2, -1); clipPolyVsPlane(2, -1);
clipPolyVsPlane(2, 1); clipPolyVsPlane(2, 1);
//TODO - we need to parameterize back plane clipping //TODO - we need to parameterize back plane clipping
if(tempClippedPoly.type < 3) if(tempClippedPoly.type < 3)
{ {
//a totally clipped poly. discard it. //a totally clipped poly. discard it.
//or, a degenerate poly. we're not handling these right now //or, a degenerate poly. we're not handling these right now
} }
else if(tempClippedPoly.type < 5) else
{ {
//TODO - build right in this list instead of copying
clippedPolys[clippedPolyCounter] = tempClippedPoly; clippedPolys[clippedPolyCounter] = tempClippedPoly;
clippedPolys[clippedPolyCounter].poly = poly; clippedPolys[clippedPolyCounter].poly = poly;
clippedPolyCounter++; clippedPolyCounter++;
} }
else
{
//turn into a triangle fan. no point even trying to make quads since those would have to get split anyway.
//well, maybe it could end up being faster.
for(int i=0;i<tempClippedPoly.type-2;i++)
{
clippedPolys[clippedPolyCounter].type = 3;
clippedPolys[clippedPolyCounter].poly = poly;
clippedPolys[clippedPolyCounter].clipVerts[0] = tempClippedPoly.clipVerts[0];
clippedPolys[clippedPolyCounter].clipVerts[1] = tempClippedPoly.clipVerts[i+1];
clippedPolys[clippedPolyCounter].clipVerts[2] = tempClippedPoly.clipVerts[i+2];
clippedPolyCounter++;
}
}
} }
static void SoftRastRender() static void SoftRastRender()
@ -1128,19 +1118,15 @@ static void SoftRastRender()
//iterate over polys //iterate over polys
bool needInitTexture = true; bool needInitTexture = true;
polynum = 0;
for(int i=0;i<clippedPolyCounter;i++) for(int i=0;i<clippedPolyCounter;i++)
{ {
polynum = i;
TClippedPoly &clippedPoly = clippedPolys[i]; TClippedPoly &clippedPoly = clippedPolys[i];
POLY *poly = clippedPoly.poly; POLY *poly = clippedPoly.poly;
int type = clippedPoly.type; int type = clippedPoly.type;
VERT* verts[4] = { VERT* verts = &clippedPoly.clipVerts[0];
&clippedPoly.clipVerts[0],
&clippedPoly.clipVerts[1],
&clippedPoly.clipVerts[2],
type==4?&clippedPoly.clipVerts[3]:0
};
if(i == 0 || lastPolyAttr != poly->polyAttr) if(i == 0 || lastPolyAttr != poly->polyAttr)
{ {
@ -1152,12 +1138,12 @@ static void SoftRastRender()
//this should be moved to gfx3d, but first we need to redo the way the lists are built //this should be moved to gfx3d, but first we need to redo the way the lists are built
//because it is too convoluted right now. //because it is too convoluted right now.
//(must we throw out verts if a poly gets backface culled? if not, then it might be easier) //(must we throw out verts if a poly gets backface culled? if not, then it might be easier)
//TODO - is this good enough for quads? we think so. //TODO - is this good enough for quads and other shapes? we think so.
float ab[2], ac[2]; float ab[2], ac[2];
Vector2Copy(ab, verts[1]->coord); Vector2Copy(ab, verts[1].coord);
Vector2Copy(ac, verts[2]->coord); Vector2Copy(ac, verts[2].coord);
Vector2Subtract(ab, verts[0]->coord); Vector2Subtract(ab, verts[0].coord);
Vector2Subtract(ac, verts[0]->coord); Vector2Subtract(ac, verts[0].coord);
float cross = Vector2Cross(ab, ac); float cross = Vector2Cross(ab, ac);
bool backfacing = (cross<0); bool backfacing = (cross<0);
@ -1181,54 +1167,15 @@ static void SoftRastRender()
//which is currently just a float //which is currently just a float
for(int i=0;i<type;i++) for(int i=0;i<type;i++)
for(int j=0;j<2;j++) for(int j=0;j<2;j++)
verts[i]->coord[j] = iround(16.0f * verts[i]->coord[j]); verts[i].coord[j] = iround(16.0f * verts[i].coord[j]);
//hmm... shader gets setup every time because it depends on sampler which may have just changed //hmm... shader gets setup every time because it depends on sampler which may have just changed
shader.setup(poly->polyAttr); shader.setup(poly->polyAttr);
//note that when we build our triangle vert lists, we reorder them for our renderer. for(int i=0;i<MAX_CLIPPED_VERTS;i++)
//we should probably fix the renderer so we dont have to do this; ::verts[i] = &verts[i];
//but then again, what does it matter?
if(type == 4)
{
if(backfacing)
{
SubmitVertex(3,verts[0]);
SubmitVertex(2,verts[1]);
SubmitVertex(1,verts[2]);
SubmitVertex(0,verts[3]);
shape_engine();polynum++;
}
else
{
SubmitVertex(3,verts[3]);
SubmitVertex(2,verts[2]);
SubmitVertex(1,verts[1]);
SubmitVertex(0,verts[0]);
shape_engine();polynum++;
}
}
else if(type == 3)
{
if(backfacing)
{
SubmitVertex(3,verts[0]);
SubmitVertex(2,verts[0]);
SubmitVertex(1,verts[1]);
SubmitVertex(0,verts[2]);
shape_engine();polynum++;
}
else
{
SubmitVertex(3,verts[2]);
SubmitVertex(2,verts[2]);
SubmitVertex(1,verts[1]);
SubmitVertex(0,verts[0]);
shape_engine();polynum++;
}
} else printf("skipping type %d\n",type);
shape_engine(type,backfacing);
} }
// printf("rendered %d of %d polys after backface culling\n",gfx3d.polylist->count-culled,gfx3d.polylist->count); // printf("rendered %d of %d polys after backface culling\n",gfx3d.polylist->count-culled,gfx3d.polylist->count);