Fixing wraparound.

This still needs a tremendous amount of cleanup.
This commit is contained in:
Ben Vanik 2013-10-13 21:18:23 -07:00
parent 4887234bba
commit 2eed0b1575
2 changed files with 334 additions and 273 deletions

View File

@ -30,6 +30,7 @@ RingBufferWorker::RingBufferWorker(xe_memory_ref memory) :
read_ptr_update_freq_ = 0; read_ptr_update_freq_ = 0;
read_ptr_writeback_ptr_ = 0; read_ptr_writeback_ptr_ = 0;
write_ptr_index_ = 0; write_ptr_index_ = 0;
write_ptr_max_index_ = 0;
} }
RingBufferWorker::~RingBufferWorker() { RingBufferWorker::~RingBufferWorker() {
@ -46,6 +47,9 @@ void RingBufferWorker::Initialize(GraphicsDriver* driver,
uint32_t original_size = 1 << (0x1C - page_count - 1); uint32_t original_size = 1 << (0x1C - page_count - 1);
primary_buffer_size_ = original_size; primary_buffer_size_ = original_size;
read_ptr_index_ = 0; read_ptr_index_ = 0;
// Tell the driver what to use for translation.
driver_->set_address_translation(primary_buffer_ptr_ & ~0x1FFFFFFF);
} }
void RingBufferWorker::EnableReadPointerWriteBack(uint32_t ptr, void RingBufferWorker::EnableReadPointerWriteBack(uint32_t ptr,
@ -60,6 +64,7 @@ void RingBufferWorker::EnableReadPointerWriteBack(uint32_t ptr,
} }
void RingBufferWorker::UpdateWritePointer(uint32_t value) { void RingBufferWorker::UpdateWritePointer(uint32_t value) {
write_ptr_max_index_ = MAX(write_ptr_max_index_, value);
write_ptr_index_ = value; write_ptr_index_ = value;
SetEvent(write_ptr_index_event_); SetEvent(write_ptr_index_event_);
} }
@ -82,6 +87,7 @@ void RingBufferWorker::Pump() {
// Bring local so we don't have to worry about them changing out from under // Bring local so we don't have to worry about them changing out from under
// us. // us.
uint32_t write_ptr_index = write_ptr_index_; uint32_t write_ptr_index = write_ptr_index_;
uint32_t write_ptr_max_index = write_ptr_max_index_;
if (read_ptr_index_ == write_ptr_index) { if (read_ptr_index_ == write_ptr_index) {
return; return;
} }
@ -89,24 +95,9 @@ void RingBufferWorker::Pump() {
// Process the new commands. // Process the new commands.
XELOGGPU("Ring buffer thread work"); XELOGGPU("Ring buffer thread work");
// Handle wrapping around. // Execute. Note that we handle wraparound transparently.
// TODO(benvanik): verify this is correct. ExecutePrimaryBuffer(read_ptr_index_, write_ptr_index);
if (write_ptr_index_ < read_ptr_index_) {
// We wrapped. Execute all instructions until the end and go back to 0.
XELOGGPU("Ring buffer wrapped back to zero (read %0.8X, write %0.8X)",
read_ptr_index_, write_ptr_index);
uint32_t pre_length = (primary_buffer_size_ / 4) - read_ptr_index_;
if (pre_length) {
ExecuteSegment(primary_buffer_ptr_ + read_ptr_index_ * 4, pre_length);
}
read_ptr_index_ = 0;
}
uint32_t length = write_ptr_index - read_ptr_index_;
if (length) {
ExecuteSegment(primary_buffer_ptr_ + read_ptr_index_ * 4, length);
read_ptr_index_ = write_ptr_index; read_ptr_index_ = write_ptr_index;
}
// TODO(benvanik): use read_ptr_update_freq_ and only issue after moving // TODO(benvanik): use read_ptr_update_freq_ and only issue after moving
// that many indices. // that many indices.
@ -115,36 +106,88 @@ void RingBufferWorker::Pump() {
} }
} }
void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) { void RingBufferWorker::ExecutePrimaryBuffer(
uint8_t* p = xe_memory_addr(memory_); uint32_t start_index, uint32_t end_index) {
RegisterFile* regs = driver_->register_file(); // Adjust pointer base.
uint32_t ptr = primary_buffer_ptr_ + start_index * 4;
ptr = (primary_buffer_ptr_ & ~0x1FFFFFFF) | (ptr & 0x1FFFFFFF);
uint32_t end_ptr = primary_buffer_ptr_ + end_index * 4;
end_ptr = (primary_buffer_ptr_ & ~0x1FFFFFFF) | (end_ptr & 0x1FFFFFFF);
XELOGGPU("[%.8X] ExecutePrimaryBuffer(%dw -> %dw)",
start_index, end_index);
// Execute commands!
PacketArgs args;
args.ptr = ptr;
args.base_ptr = primary_buffer_ptr_;
args.max_address = primary_buffer_ptr_ + primary_buffer_size_ * 4;
args.ptr_mask = (primary_buffer_size_ / 4) - 1;
uint32_t n = 0;
while (args.ptr != end_ptr) {
n += ExecutePacket(args);
}
if (end_index > start_index) {
XEASSERT(n == (end_index - start_index));
}
XELOGGPU(" ExecutePrimaryBuffer End");
}
void RingBufferWorker::ExecuteIndirectBuffer(uint32_t ptr, uint32_t length) {
// Adjust pointer base. // Adjust pointer base.
ptr = (primary_buffer_ptr_ & ~0x1FFFFFFF) | (ptr & 0x1FFFFFFF); ptr = (primary_buffer_ptr_ & ~0x1FFFFFFF) | (ptr & 0x1FFFFFFF);
// Tell the driver what to use for translation. XELOGGPU("[%.8X] ExecuteIndirectBuffer(%dw)", ptr, length);
driver_->set_address_translation(primary_buffer_ptr_ & ~0x1FFFFFFF);
// Execute commands!
PacketArgs args;
args.ptr = ptr;
args.base_ptr = ptr;
args.max_address = ptr + length * 4;
args.ptr_mask = 0;
for (uint32_t n = 0; n < length;) {
n += ExecutePacket(args);
XEASSERT(n <= length);
}
XELOGGPU(" ExecuteIndirectBuffer End");
}
#define LOG_DATA(count) \ #define LOG_DATA(count) \
for (uint32_t __m = 0; __m < count; __m++) { \ for (uint32_t __m = 0; __m < count; __m++) { \
XELOGGPU("[%.8X] %.8X", \ XELOGGPU("[%.8X] %.8X", \
ptr + (n + 1 + __m) * 4, \ packet_ptr + (1 + __m) * 4, \
XEGETUINT32BE(packet_base + 1 * 4 + __m * 4)); \ XEGETUINT32BE(packet_base + 1 * 4 + __m * 4)); \
} }
#define TRANSLATE_ADDR(p) \ #define TRANSLATE_ADDR(p) \
((p & ~0x3) + (primary_buffer_ptr_ & ~0x1FFFFFFF)) ((p & ~0x3) + (primary_buffer_ptr_ & ~0x1FFFFFFF))
XELOGGPU("[%.8X] CommandList(): executing %dw", ptr, length); void RingBufferWorker::AdvancePtr(PacketArgs& args, uint32_t n) {
args.ptr = args.ptr + n * 4;
if (args.ptr_mask) {
args.ptr =
args.base_ptr + (((args.ptr - args.base_ptr) / 4) & args.ptr_mask) * 4;
}
}
#define ADVANCE_PTR(n) AdvancePtr(args, n)
#define READ_PTR() \
XEGETUINT32BE(p + args.ptr)
#define READ_AND_ADVANCE_PTR() \
XEGETUINT32BE(p + args.ptr); ADVANCE_PTR(1);
// Execute commands! uint32_t RingBufferWorker::ExecutePacket(PacketArgs& args) {
for (uint32_t n = 0; n < length;) { uint8_t* p = xe_memory_addr(memory_);
const uint8_t* packet_base = p + ptr + n * 4; RegisterFile* regs = driver_->register_file();
const uint32_t packet = XEGETUINT32BE(packet_base);
uint32_t packet_ptr = args.ptr;
const uint8_t* packet_base = p + packet_ptr;
const uint32_t packet = READ_PTR();
ADVANCE_PTR(1);
const uint32_t packet_type = packet >> 30; const uint32_t packet_type = packet >> 30;
if (packet == 0) { if (packet == 0) {
n++; return 1;
continue;
} }
switch (packet_type) { switch (packet_type) {
@ -153,22 +196,23 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
// Type-0 packet. // Type-0 packet.
// Write count registers in sequence to the registers starting at // Write count registers in sequence to the registers starting at
// (base_index << 2). // (base_index << 2).
XELOGGPU("[%.8X] Packet(%.8X): set registers:", ptr + n * 4, XELOGGPU("[%.8X] Packet(%.8X): set registers:",
ptr + n * 4, packet); packet_ptr, packet);
uint32_t count = ((packet >> 16) & 0x3FFF) + 1; uint32_t count = ((packet >> 16) & 0x3FFF) + 1;
uint32_t base_index = (packet & 0xFFFF); uint32_t base_index = (packet & 0xFFFF);
for (uint32_t m = 0; m < count; m++) { for (uint32_t m = 0; m < count; m++) {
uint32_t reg_data = XEGETUINT32BE(packet_base + 1 * 4 + m * 4); uint32_t reg_data = READ_PTR();
const char* reg_name = xenos::GetRegisterName(base_index + m); const char* reg_name = xenos::GetRegisterName(base_index + m);
XELOGGPU("[%.8X] %.8X -> %.4X %s", XELOGGPU("[%.8X] %.8X -> %.4X %s",
ptr + (n + 1 + m) * 4, args.ptr,
reg_data, base_index + m, reg_name ? reg_name : ""); reg_data, base_index + m, reg_name ? reg_name : "");
ADVANCE_PTR(1);
// TODO(benvanik): exec write handler (if special). // TODO(benvanik): exec write handler (if special).
if (base_index + m < kXEGpuRegisterCount) { if (base_index + m < kXEGpuRegisterCount) {
regs->values[base_index + m].u32 = reg_data; regs->values[base_index + m].u32 = reg_data;
} }
} }
n += 1 + count; return 1 + count;
} }
break; break;
case 0x01: case 0x01:
@ -176,18 +220,20 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
// Type-1 packet. // Type-1 packet.
// Contains two registers of data. Type-0 should be more common. // Contains two registers of data. Type-0 should be more common.
XELOGGPU("[%.8X] Packet(%.8X): set registers:", XELOGGPU("[%.8X] Packet(%.8X): set registers:",
ptr + n * 4, packet); packet_ptr, packet);
uint32_t reg_index_1 = packet & 0x7FF; uint32_t reg_index_1 = packet & 0x7FF;
uint32_t reg_index_2 = (packet >> 11) & 0x7FF; uint32_t reg_index_2 = (packet >> 11) & 0x7FF;
uint32_t reg_data_1 = XEGETUINT32BE(packet_base + 1 * 4); uint32_t reg_ptr_1 = args.ptr;
uint32_t reg_data_2 = XEGETUINT32BE(packet_base + 2 * 4); uint32_t reg_data_1 = READ_AND_ADVANCE_PTR();
uint32_t reg_ptr_2 = args.ptr;
uint32_t reg_data_2 = READ_AND_ADVANCE_PTR();
const char* reg_name_1 = xenos::GetRegisterName(reg_index_1); const char* reg_name_1 = xenos::GetRegisterName(reg_index_1);
const char* reg_name_2 = xenos::GetRegisterName(reg_index_2); const char* reg_name_2 = xenos::GetRegisterName(reg_index_2);
XELOGGPU("[%.8X] %.8X -> %.4X %s", XELOGGPU("[%.8X] %.8X -> %.4X %s",
ptr + (n + 1) * 4, reg_ptr_1,
reg_data_1, reg_index_1, reg_name_1 ? reg_name_1 : ""); reg_data_1, reg_index_1, reg_name_1 ? reg_name_1 : "");
XELOGGPU("[%.8X] %.8X -> %.4X %s", XELOGGPU("[%.8X] %.8X -> %.4X %s",
ptr + (n + 2) * 4, reg_ptr_2,
reg_data_2, reg_index_2, reg_name_2 ? reg_name_2 : ""); reg_data_2, reg_index_2, reg_name_2 ? reg_name_2 : "");
// TODO(benvanik): exec write handler (if special). // TODO(benvanik): exec write handler (if special).
if (reg_index_1 < kXEGpuRegisterCount) { if (reg_index_1 < kXEGpuRegisterCount) {
@ -196,15 +242,13 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
if (reg_index_2 < kXEGpuRegisterCount) { if (reg_index_2 < kXEGpuRegisterCount) {
regs->values[reg_index_2].u32 = reg_data_2; regs->values[reg_index_2].u32 = reg_data_2;
} }
return 1 + 2;
n += 1 + 2;
} }
break; break;
case 0x02: case 0x02:
// Type-2 packet. // Type-2 packet.
// No-op. Do nothing. // No-op. Do nothing.
n++; return 1;
break;
case 0x03: case 0x03:
{ {
// Type-3 packet. // Type-3 packet.
@ -216,70 +260,72 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
case PM4_ME_INIT: case PM4_ME_INIT:
// initialize CP's micro-engine // initialize CP's micro-engine
XELOGGPU("[%.8X] Packet(%.8X): PM4_ME_INIT", XELOGGPU("[%.8X] Packet(%.8X): PM4_ME_INIT",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
ADVANCE_PTR(count);
break; break;
case PM4_NOP: case PM4_NOP:
// skip N 32-bit words to get to the next packet // skip N 32-bit words to get to the next packet
// No-op, ignore some data. // No-op, ignore some data.
XELOGGPU("[%.8X] Packet(%.8X): PM4_NOP", XELOGGPU("[%.8X] Packet(%.8X): PM4_NOP",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
ADVANCE_PTR(count);
break; break;
case PM4_INDIRECT_BUFFER: case PM4_INDIRECT_BUFFER:
// indirect buffer dispatch // indirect buffer dispatch
{ {
uint32_t list_ptr = XEGETUINT32BE(packet_base + 1 * 4); uint32_t list_ptr = READ_AND_ADVANCE_PTR();
uint32_t list_length = XEGETUINT32BE(packet_base + 2 * 4); uint32_t list_length = READ_AND_ADVANCE_PTR();
XELOGGPU("[%.8X] Packet(%.8X): PM4_INDIRECT_BUFFER %.8X (%dw)", XELOGGPU("[%.8X] Packet(%.8X): PM4_INDIRECT_BUFFER %.8X (%dw)",
ptr + n * 4, packet, list_ptr, list_length); packet_ptr, packet, list_ptr, list_length);
ExecuteSegment(list_ptr, list_length); ExecuteIndirectBuffer(list_ptr, list_length);
driver_->set_address_translation(primary_buffer_ptr_ & ~0x1FFFFFFF);
} }
break; break;
case PM4_WAIT_REG_MEM: case PM4_WAIT_REG_MEM:
// wait until a register or memory location is a specific value // wait until a register or memory location is a specific value
XELOGGPU("[%.8X] Packet(%.8X): PM4_WAIT_REG_MEM", XELOGGPU("[%.8X] Packet(%.8X): PM4_WAIT_REG_MEM",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
ADVANCE_PTR(count);
break; break;
case PM4_REG_RMW: case PM4_REG_RMW:
// register read/modify/write // register read/modify/write
// ? (used during shader upload and edram setup) // ? (used during shader upload and edram setup)
XELOGGPU("[%.8X] Packet(%.8X): PM4_REG_RMW", XELOGGPU("[%.8X] Packet(%.8X): PM4_REG_RMW",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
ADVANCE_PTR(count);
break; break;
case PM4_COND_WRITE: case PM4_COND_WRITE:
// conditional write to memory or register // conditional write to memory or register
XELOGGPU("[%.8X] Packet(%.8X): PM4_COND_WRITE", XELOGGPU("[%.8X] Packet(%.8X): PM4_COND_WRITE",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
ADVANCE_PTR(count);
break; break;
case PM4_EVENT_WRITE: case PM4_EVENT_WRITE:
// generate an event that creates a write to memory when completed // generate an event that creates a write to memory when completed
XELOGGPU("[%.8X] Packet(%.8X): PM4_EVENT_WRITE", XELOGGPU("[%.8X] Packet(%.8X): PM4_EVENT_WRITE",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
ADVANCE_PTR(count);
break; break;
case PM4_EVENT_WRITE_SHD: case PM4_EVENT_WRITE_SHD:
// generate a VS|PS_done event // generate a VS|PS_done event
{ {
XELOGGPU("[%.8X] Packet(%.8X): PM4_EVENT_WRITE_SHD", XELOGGPU("[%.8X] Packet(%.8X): PM4_EVENT_WRITE_SHD",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
// 3? uint32_t d0 = READ_AND_ADVANCE_PTR(); // 3?
uint32_t d0 = XEGETUINT32BE(packet_base + 1 * 4); uint32_t d1 = READ_AND_ADVANCE_PTR(); // ptr
// ptr uint32_t d2 = READ_AND_ADVANCE_PTR(); // value?
uint32_t d1 = XEGETUINT32BE(packet_base + 2 * 4);
// value?
uint32_t d2 = XEGETUINT32BE(packet_base + 3 * 4);
XESETUINT32BE(p + TRANSLATE_ADDR(d1), d2); XESETUINT32BE(p + TRANSLATE_ADDR(d1), d2);
} }
break; break;
@ -288,11 +334,11 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
// initiate fetch of index buffer and draw // initiate fetch of index buffer and draw
{ {
XELOGGPU("[%.8X] Packet(%.8X): PM4_DRAW_INDX", XELOGGPU("[%.8X] Packet(%.8X): PM4_DRAW_INDX",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
// d0 = viz query info // d0 = viz query info
uint32_t d0 = XEGETUINT32BE(packet_base + 1 * 4); uint32_t d0 = READ_AND_ADVANCE_PTR();
uint32_t d1 = XEGETUINT32BE(packet_base + 2 * 4); uint32_t d1 = READ_AND_ADVANCE_PTR();
uint32_t index_count = d1 >> 16; uint32_t index_count = d1 >> 16;
uint32_t prim_type = d1 & 0x3F; uint32_t prim_type = d1 & 0x3F;
uint32_t src_sel = (d1 >> 6) & 0x3; uint32_t src_sel = (d1 >> 6) & 0x3;
@ -306,9 +352,9 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
// draw using supplied indices in packet // draw using supplied indices in packet
{ {
XELOGGPU("[%.8X] Packet(%.8X): PM4_DRAW_INDX_2", XELOGGPU("[%.8X] Packet(%.8X): PM4_DRAW_INDX_2",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
uint32_t d0 = XEGETUINT32BE(packet_base + 1 * 4); uint32_t d0 = READ_AND_ADVANCE_PTR();
uint32_t index_count = d0 >> 16; uint32_t index_count = d0 >> 16;
uint32_t prim_type = d0 & 0x3F; uint32_t prim_type = d0 & 0x3F;
uint32_t src_sel = (d0 >> 6) & 0x3; uint32_t src_sel = (d0 >> 6) & 0x3;
@ -323,12 +369,12 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
// load sequencer instruction memory (pointer-based) // load sequencer instruction memory (pointer-based)
{ {
XELOGGPU("[%.8X] Packet(%.8X): PM4_IM_LOAD", XELOGGPU("[%.8X] Packet(%.8X): PM4_IM_LOAD",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
uint32_t addr_type = XEGETUINT32BE(packet_base + 1 * 4); uint32_t addr_type = READ_AND_ADVANCE_PTR();
uint32_t type = addr_type & 0x3; uint32_t type = addr_type & 0x3;
uint32_t addr = addr_type & ~0x3; uint32_t addr = addr_type & ~0x3;
uint32_t start_size = XEGETUINT32BE(packet_base + 2 * 4); uint32_t start_size = READ_AND_ADVANCE_PTR();
uint32_t start = start_size >> 16; uint32_t start = start_size >> 16;
uint32_t size = start_size & 0xFFFF; // dwords uint32_t size = start_size & 0xFFFF; // dwords
XEASSERT(start == 0); XEASSERT(start == 0);
@ -343,18 +389,21 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
// load sequencer instruction memory (code embedded in packet) // load sequencer instruction memory (code embedded in packet)
{ {
XELOGGPU("[%.8X] Packet(%.8X): PM4_IM_LOAD_IMMEDIATE", XELOGGPU("[%.8X] Packet(%.8X): PM4_IM_LOAD_IMMEDIATE",
ptr + n * 4, packet); packet_ptr, packet);
uint32_t type = XEGETUINT32BE(packet_base + 1 * 4); LOG_DATA(count);
uint32_t start_size = XEGETUINT32BE(packet_base + 2 * 4); uint32_t type = READ_AND_ADVANCE_PTR();
uint32_t start_size = READ_AND_ADVANCE_PTR();
uint32_t start = start_size >> 16; uint32_t start = start_size >> 16;
uint32_t size = start_size & 0xFFFF; // dwords uint32_t size = start_size & 0xFFFF; // dwords
XEASSERT(start == 0); XEASSERT(start == 0);
LOG_DATA(count); // TODO(benvanik): figure out if this could wrap.
XEASSERT(args.ptr + size * 4 < args.max_address);
driver_->SetShader( driver_->SetShader(
(XE_GPU_SHADER_TYPE)type, (XE_GPU_SHADER_TYPE)type,
ptr + n * 4 + 3 * 4, args.ptr,
start, start,
size * 4); size * 4);
ADVANCE_PTR(size);
} }
break; break;
@ -362,23 +411,25 @@ void RingBufferWorker::ExecuteSegment(uint32_t ptr, uint32_t length) {
// selective invalidation of state pointers // selective invalidation of state pointers
{ {
XELOGGPU("[%.8X] Packet(%.8X): PM4_INVALIDATE_STATE", XELOGGPU("[%.8X] Packet(%.8X): PM4_INVALIDATE_STATE",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
uint32_t mask = XEGETUINT32BE(packet_base + 1 * 4); uint32_t mask = READ_AND_ADVANCE_PTR();
driver_->InvalidateState(mask); driver_->InvalidateState(mask);
} }
break; break;
default: default:
XELOGGPU("[%.8X] Packet(%.8X): unknown!", XELOGGPU("[%.8X] Packet(%.8X): unknown!",
ptr + n * 4, packet); packet_ptr, packet);
LOG_DATA(count); LOG_DATA(count);
ADVANCE_PTR(count);
break; break;
} }
n += 1 + count; return 1 + count;
} }
break; break;
} }
}
return 0;
} }

View File

@ -35,8 +35,17 @@ public:
void Pump(); void Pump();
protected: private:
void ExecuteSegment(uint32_t ptr, uint32_t length); typedef struct {
uint32_t ptr;
uint32_t base_ptr;
uint32_t max_address;
uint32_t ptr_mask;
} PacketArgs;
void AdvancePtr(PacketArgs& args, uint32_t n);
void ExecutePrimaryBuffer(uint32_t start_index, uint32_t end_index);
void ExecuteIndirectBuffer(uint32_t ptr, uint32_t length);
uint32_t ExecutePacket(PacketArgs& args);
protected: protected:
xe_memory_ref memory_; xe_memory_ref memory_;
@ -52,6 +61,7 @@ protected:
HANDLE write_ptr_index_event_; HANDLE write_ptr_index_event_;
volatile uint32_t write_ptr_index_; volatile uint32_t write_ptr_index_;
volatile uint32_t write_ptr_max_index_;
}; };