From 34ba061b603926c07bcba0c4d9d848629e1d393b Mon Sep 17 00:00:00 2001 From: Jannik Vogel Date: Fri, 17 Jul 2015 03:57:42 +0200 Subject: [PATCH] Better and complete buffering for the inline-buffers --- hw/xbox/nv2a.c | 176 ++++++++++++++++++++++++------------------------- 1 file changed, 85 insertions(+), 91 deletions(-) diff --git a/hw/xbox/nv2a.c b/hw/xbox/nv2a.c index 480e89067f..10400de12f 100644 --- a/hw/xbox/nv2a.c +++ b/hw/xbox/nv2a.c @@ -1309,11 +1309,14 @@ typedef struct VertexAttribute { unsigned int converted_size; unsigned int converted_count; + float *inline_buffer_buffer; + GLint gl_count; GLenum gl_type; GLboolean gl_normalize; GLuint gl_converted_buffer; + GLuint gl_inline_buffer_buffer; } VertexAttribute; typedef struct VertexShaderConstant { @@ -1403,13 +1406,6 @@ typedef struct TextureBinding { unsigned int refcnt; } TextureBinding; -typedef struct InlineVertexBufferEntry { - float position[4]; - float weight[4]; - float diffuse[4]; - float tex_coord[NV2A_MAX_TEXTURES][4]; -} InlineVertexBufferEntry; - typedef struct KelvinState { hwaddr dma_notifies; hwaddr dma_state; @@ -1537,8 +1533,6 @@ typedef struct PGRAPHState { uint32_t inline_elements[NV2A_MAX_BATCH_LENGTH]; unsigned int inline_buffer_length; - InlineVertexBufferEntry inline_buffer[NV2A_MAX_BATCH_LENGTH]; - GLuint gl_inline_buffer_buffer; GLuint gl_element_buffer; GLuint gl_memory_buffer; @@ -3759,9 +3753,9 @@ static void pgraph_init(NV2AState *d) for (i=0; ivertex_attributes[i].gl_converted_buffer); + glGenBuffers(1, &pg->vertex_attributes[i].gl_inline_buffer_buffer); } glGenBuffers(1, &pg->gl_inline_array_buffer); - glGenBuffers(1, &pg->gl_inline_buffer_buffer); glGenBuffers(1, &pg->gl_element_buffer); glGenBuffers(1, &pg->gl_memory_buffer); @@ -3858,31 +3852,39 @@ static unsigned int kelvin_map_texgen(uint32_t parameter, unsigned int channel) return texgen; } -static void finish_inline_vertex(PGRAPHState *pg) +static void allocate_inline_buffer_vertices(PGRAPHState *pg, unsigned int attr) +{ + int i; + VertexAttribute *attribute = &pg->vertex_attributes[attr]; + + if (attribute->inline_buffer_buffer || pg->inline_buffer_length == 0) { + return; + } + + /* Now upload the previous attribute value */ + attribute->inline_buffer_buffer = g_malloc(NV2A_MAX_BATCH_LENGTH + * sizeof(float) * 4); + for (i = 0; i < pg->inline_buffer_length; i++) { + memcpy(&attribute->inline_buffer_buffer[i * 4], + attribute->inline_value, + sizeof(float) * 4); + } +} + +static void finish_inline_buffer_vertex(PGRAPHState *pg) { int i; assert(pg->inline_buffer_length < NV2A_MAX_BATCH_LENGTH); - InlineVertexBufferEntry *entry = - &pg->inline_buffer[pg->inline_buffer_length]; - - memcpy(entry->position, - pg->vertex_attributes[NV2A_VERTEX_ATTR_POSITION].inline_value, - sizeof(float) * 4); - - memcpy(entry->weight, - pg->vertex_attributes[NV2A_VERTEX_ATTR_WEIGHT].inline_value, - sizeof(float) * 4); - - memcpy(entry->diffuse, - pg->vertex_attributes[NV2A_VERTEX_ATTR_DIFFUSE].inline_value, - sizeof(float) * 4); - - for (i = 0; i < NV2A_MAX_TEXTURES; i++) { - memcpy(entry->tex_coord[i], - pg->vertex_attributes[NV2A_VERTEX_ATTR_TEXTURE0+i].inline_value, - sizeof(float)*4); + for (i = 0; i < NV2A_VERTEXSHADER_ATTRIBUTES; i++) { + VertexAttribute *attribute = &pg->vertex_attributes[i]; + if (attribute->inline_buffer_buffer) { + memcpy(&attribute->inline_buffer_buffer[ + pg->inline_buffer_length * 4], + attribute->inline_value, + sizeof(float) * 4); + } } pg->inline_buffer_length++; @@ -4597,9 +4599,12 @@ static void pgraph_method(NV2AState *d, case NV097_SET_VERTEX4F ... NV097_SET_VERTEX4F + 12: { slot = (class_method - NV097_SET_VERTEX4F) / 4; - pg->vertex_attributes[NV2A_VERTEX_ATTR_POSITION].inline_value[slot] = *(float*)¶meter; + VertexAttribute *attribute = + &pg->vertex_attributes[NV2A_VERTEX_ATTR_POSITION]; + allocate_inline_buffer_vertices(pg, NV2A_VERTEX_ATTR_POSITION); + attribute->inline_value[slot] = *(float*)¶meter; if (slot == 3) { - finish_inline_vertex(pg); + finish_inline_buffer_vertex(pg); } break; } @@ -4717,48 +4722,31 @@ static void pgraph_method(NV2AState *d, if (parameter == NV097_SET_BEGIN_END_OP_END) { if (pg->inline_buffer_length) { - // pgraph_bind_vertex_attributes(...) + for (i = 0; i < NV2A_VERTEXSHADER_ATTRIBUTES; i++) { + VertexAttribute *attribute = &pg->vertex_attributes[i]; - glBindBuffer(GL_ARRAY_BUFFER, pg->gl_inline_buffer_buffer); - glBufferData(GL_ARRAY_BUFFER, - pg->inline_buffer_length - * sizeof(InlineVertexBufferEntry), - pg->inline_buffer, - GL_DYNAMIC_DRAW); + if (attribute->inline_buffer_buffer) { - glVertexAttribPointer(NV2A_VERTEX_ATTR_POSITION, - 4, - GL_FLOAT, - GL_FALSE, - sizeof(InlineVertexBufferEntry), - (void*)offsetof(InlineVertexBufferEntry, position)); - glEnableVertexAttribArray(NV2A_VERTEX_ATTR_POSITION); + glBindBuffer(GL_ARRAY_BUFFER, + attribute->gl_inline_buffer_buffer); + glBufferData(GL_ARRAY_BUFFER, + pg->inline_buffer_length + * sizeof(float) * 4, + attribute->inline_buffer_buffer, + GL_DYNAMIC_DRAW); - glVertexAttribPointer(NV2A_VERTEX_ATTR_WEIGHT, - 4, - GL_FLOAT, - GL_FALSE, - sizeof(InlineVertexBufferEntry), - (void*)offsetof(InlineVertexBufferEntry, weight)); - glEnableVertexAttribArray(NV2A_VERTEX_ATTR_WEIGHT); + /* Clear buffer for next batch */ + g_free(attribute->inline_buffer_buffer); + attribute->inline_buffer_buffer = NULL; - glVertexAttribPointer(NV2A_VERTEX_ATTR_DIFFUSE, - 4, - GL_FLOAT, - GL_FALSE, - sizeof(InlineVertexBufferEntry), - (void*)offsetof(InlineVertexBufferEntry, diffuse)); - glEnableVertexAttribArray(NV2A_VERTEX_ATTR_DIFFUSE); + glVertexAttribPointer(i, 4, GL_FLOAT, GL_FALSE, 0, 0); + glEnableVertexAttribArray(i); + } else { + glDisableVertexAttribArray(i); + + glVertexAttrib4fv(i, attribute->inline_value); + } - for (i=0; igl_primitive_mode, @@ -4899,6 +4887,7 @@ static void pgraph_method(NV2AState *d, pg->inline_elements_length = 0; pg->inline_array_length = 0; pg->inline_buffer_length = 0; + } pgraph_set_surface_dirty(pg, true, depth_test || stencil_test); @@ -5024,45 +5013,50 @@ static void pgraph_method(NV2AState *d, case NV097_SET_VERTEX_DATA2F_M ... NV097_SET_VERTEX_DATA2F_M + 0x7c: { - slot = (class_method - NV097_SET_VERTEX_DATA2F_M) / 8; - unsigned int part = - ((class_method - NV097_SET_VERTEX_DATA2F_M) % 8) / 4; - pg->vertex_attributes[slot].inline_value[part] = *(float*)¶meter; - pg->vertex_attributes[slot].inline_value[2] = 0.0; - pg->vertex_attributes[slot].inline_value[3] = 1.0; + slot = (class_method - NV097_SET_VERTEX_DATA2F_M) / 4; + unsigned int part = slot % 2; + slot /= 2; + VertexAttribute *attribute = &pg->vertex_attributes[slot]; + allocate_inline_buffer_vertices(pg, slot); + attribute->inline_value[part] = *(float*)¶meter; + /* FIXME: Should these really be set to 0.0 and 1.0 ? Conditions? */ + attribute->inline_value[2] = 0.0; + attribute->inline_value[3] = 1.0; if ((slot == 0) && (part == 1)) { - finish_inline_vertex(pg); + finish_inline_buffer_vertex(pg); } break; } case NV097_SET_VERTEX_DATA4F_M ... NV097_SET_VERTEX_DATA4F_M + 0xfc: { - slot = (class_method - NV097_SET_VERTEX_DATA4F_M) / 16; - unsigned int part = - ((class_method - NV097_SET_VERTEX_DATA4F_M) % 16) / 4; - pg->vertex_attributes[slot].inline_value[part] = *(float*)¶meter; + slot = (class_method - NV097_SET_VERTEX_DATA4F_M) / 4; + unsigned int part = slot % 4; + slot /= 4; + VertexAttribute *attribute = &pg->vertex_attributes[slot]; + allocate_inline_buffer_vertices(pg, slot); + attribute->inline_value[part] = *(float*)¶meter; if ((slot == 0) && (part == 3)) { - finish_inline_vertex(pg); + finish_inline_buffer_vertex(pg); } break; } case NV097_SET_VERTEX_DATA4UB ... - NV097_SET_VERTEX_DATA4UB + 0x3c: + NV097_SET_VERTEX_DATA4UB + 0x3c: { slot = (class_method - NV097_SET_VERTEX_DATA4UB) / 4; - pg->vertex_attributes[slot].inline_value[0] = - (parameter & 0xFF) / 255.0; - pg->vertex_attributes[slot].inline_value[1] = - ((parameter >> 8) & 0xFF) / 255.0; - pg->vertex_attributes[slot].inline_value[2] = - ((parameter >> 16) & 0xFF) / 255.0; - pg->vertex_attributes[slot].inline_value[3] = - ((parameter >> 24) & 0xFF) / 255.0; + VertexAttribute *attribute = &pg->vertex_attributes[slot]; + allocate_inline_buffer_vertices(pg, slot); + attribute->inline_value[0] = (parameter & 0xFF) / 255.0; + attribute->inline_value[1] = ((parameter >> 8) & 0xFF) / 255.0; + attribute->inline_value[2] = ((parameter >> 16) & 0xFF) / 255.0; + attribute->inline_value[3] = ((parameter >> 24) & 0xFF) / 255.0; if (slot == 0) { - finish_inline_vertex(pg); + finish_inline_buffer_vertex(pg); + assert(false); /* FIXME: Untested */ } break; + } case NV097_SET_SEMAPHORE_OFFSET: kelvin->semaphore_offset = parameter;