From 6547fa17487756599ef479abc9103500bb97499e Mon Sep 17 00:00:00 2001 From: Joel Linn Date: Wed, 24 Jun 2020 16:45:55 +0200 Subject: [PATCH] [APU] Rewrite XMA packet parser Use new FFmpeg frame decoder --- src/xenia/apu/xma_context.cc | 691 ++++++++++++++++++++--------------- src/xenia/apu/xma_context.h | 103 +++--- src/xenia/apu/xma_helpers.h | 15 +- 3 files changed, 460 insertions(+), 349 deletions(-) diff --git a/src/xenia/apu/xma_context.cc b/src/xenia/apu/xma_context.cc index 0ef27de25..e9415211c 100644 --- a/src/xenia/apu/xma_context.cc +++ b/src/xenia/apu/xma_context.cc @@ -25,8 +25,6 @@ extern "C" { #include "third_party/FFmpeg/libavcodec/avcodec.h" #include "third_party/FFmpeg/libavcodec/wma.h" #pragma warning(pop) - -extern AVCodec ff_xma2_decoder; } // extern "C" // Credits for most of this code goes to: @@ -38,18 +36,18 @@ namespace apu { XmaContext::XmaContext() = default; XmaContext::~XmaContext() { - if (context_) { - if (avcodec_is_open(context_)) { - avcodec_close(context_); + if (av_context_) { + if (avcodec_is_open(av_context_)) { + avcodec_close(av_context_); } - av_free(context_); + av_free(av_context_); } - if (decoded_frame_) { - av_frame_free(&decoded_frame_); - } - if (current_frame_) { - delete[] current_frame_; + if (av_frame_) { + av_frame_free(&av_frame_); } + // if (current_frame_) { + // delete[] current_frame_; + // } } int XmaContext::Setup(uint32_t id, Memory* memory, uint32_t guest_ptr) { @@ -57,46 +55,34 @@ int XmaContext::Setup(uint32_t id, Memory* memory, uint32_t guest_ptr) { memory_ = memory; guest_ptr_ = guest_ptr; - // Allocate important stuff. - codec_ = &ff_xma2_decoder; - if (!codec_) { + // Allocate ffmpeg stuff: + av_packet_ = av_packet_alloc(); + assert_not_null(av_packet_); + + // find the XMA2 audio decoder + av_codec_ = avcodec_find_decoder(AV_CODEC_ID_XMAFRAMES); + if (!av_codec_) { + XELOGE("XmaContext {}: Codec not found", id); return 1; } - context_ = avcodec_alloc_context3(codec_); - if (!context_) { + av_context_ = avcodec_alloc_context3(av_codec_); + if (!av_context_) { + XELOGE("XmaContext {}: Couldn't allocate context", id); return 1; } - decoded_frame_ = av_frame_alloc(); - if (!decoded_frame_) { - return 1; - } - - packet_ = new AVPacket(); - av_init_packet(packet_); - // Initialize these to 0. They'll actually be set later. - context_->channels = 0; - context_->sample_rate = 0; - context_->block_align = kBytesPerPacket; + av_context_->channels = 0; + av_context_->sample_rate = 0; - // Extra data passed to the decoder. - std::memset(&extra_data_, 0, sizeof(extra_data_)); - extra_data_.bits_per_sample = 16; - extra_data_.channel_mask = AV_CH_FRONT_RIGHT; - extra_data_.decode_flags = 0x10D6; + av_frame_ = av_frame_alloc(); + if (!av_frame_) { + XELOGE("XmaContext {}: Couldn't allocate frame", id); + return 1; + } - context_->extradata_size = sizeof(extra_data_); - context_->extradata = reinterpret_cast(&extra_data_); - - partial_frame_buffer_.resize(2048); - - // Current frame stuff whatever - // samples per frame * 2 max channels * output bytes - current_frame_ = new uint8_t[kSamplesPerFrame * kBytesPerSample * 2]; - - // FYI: We're purposely not opening the context here. That is done later. + // FYI: We're purposely not opening the codec here. That is done later. return 0; } @@ -110,7 +96,7 @@ bool XmaContext::Work() { auto context_ptr = memory()->TranslateVirtual(guest_ptr()); XMA_CONTEXT_DATA data(context_ptr); - DecodePackets(&data); + Decode(&data); data.Store(context_ptr); return true; } @@ -125,7 +111,7 @@ void XmaContext::Enable() { data.current_buffer, data.input_buffer_read_offset, (data.current_buffer == 0 ? data.input_buffer_0_packet_count : data.input_buffer_1_packet_count) * - kBytesPerPacket * 8); + kBitsPerPacket); data.Store(context_ptr); @@ -176,6 +162,31 @@ void XmaContext::Release() { std::memset(context_ptr, 0, sizeof(XMA_CONTEXT_DATA)); // Zero it. } +void XmaContext::SwapInputBuffer(XMA_CONTEXT_DATA* data) { + // No more frames. + if (data->current_buffer == 0) { + data->input_buffer_0_valid = 0; + } else { + data->input_buffer_1_valid = 0; + } + data->current_buffer ^= 1; + data->input_buffer_read_offset = 0; +} + +/* +void XmaContext::NextPacket( + uint8_t* input_buffer, + uint32_t input_size, + uint32_t input_buffer_read_offset) { +*/ +void XmaContext::NextPacket(XMA_CONTEXT_DATA* data) { + // auto packet_idx = GetFramePacketNumber(input_buffer, input_size, + // input_buffer_read_offset); + + // packet_idx++; + // if (packet_idx++ >= input_size) +} + int XmaContext::GetSampleRate(int id) { switch (id) { case 0: @@ -191,38 +202,6 @@ int XmaContext::GetSampleRate(int id) { return 0; } -size_t XmaContext::SavePartial(uint8_t* packet, uint32_t frame_offset_bits, - size_t frame_size_bits, bool append) { - uint8_t* buff = partial_frame_buffer_.data(); - - BitStream stream(packet, 2048 * 8); - stream.SetOffset(frame_offset_bits); - - if (!append) { - // Reset the buffer. - // TODO: Probably not necessary. - std::memset(buff, 0, partial_frame_buffer_.size()); - - size_t copy_bits = (2048 * 8) - frame_offset_bits; - size_t copy_offset = stream.Copy(buff, copy_bits); - partial_frame_offset_bits_ = copy_bits; - partial_frame_start_offset_bits_ = copy_offset; - - return copy_bits; - } else { - size_t copy_bits = frame_size_bits - partial_frame_offset_bits_; - size_t copy_offset = stream.Copy( - buff + - ((partial_frame_offset_bits_ + partial_frame_start_offset_bits_) / - 8), - copy_bits); - - partial_frame_offset_bits_ += copy_bits; - - return copy_bits; - } -} - bool XmaContext::ValidFrameOffset(uint8_t* block, size_t size_bytes, size_t frame_offset_bits) { uint32_t packet_num = @@ -233,15 +212,15 @@ bool XmaContext::ValidFrameOffset(uint8_t* block, size_t size_bytes, } uint8_t* packet = block + (packet_num * kBytesPerPacket); - size_t relative_offset_bits = frame_offset_bits % (kBytesPerPacket * 8); + size_t relative_offset_bits = frame_offset_bits % kBitsPerPacket; uint32_t first_frame_offset = xma::GetPacketFrameOffset(packet); - if (first_frame_offset == -1 || first_frame_offset > kBytesPerPacket * 8) { + if (first_frame_offset == -1 || first_frame_offset > kBitsPerPacket) { // Packet only contains a partial frame, so no frames can start here. return false; } - BitStream stream(packet, kBytesPerPacket * 8); + BitStream stream(packet, kBitsPerPacket); stream.SetOffset(first_frame_offset); while (true) { if (stream.offset_bits() == relative_offset_bits) { @@ -273,7 +252,21 @@ bool XmaContext::ValidFrameOffset(uint8_t* block, size_t size_bytes, return false; } -void XmaContext::DecodePackets(XMA_CONTEXT_DATA* data) { +static void dump_raw(AVFrame* frame, int id) { + FILE* outfile = fopen(fmt::format("out{}.raw", id).c_str(), "ab"); + if (!outfile) { + return; + } + size_t data_size = sizeof(float); + for (int i = 0; i < frame->nb_samples; i++) { + for (int ch = 0; ch < frame->channels; ch++) { + fwrite(frame->data[ch] + data_size * i, 1, data_size, outfile); + } + } + fclose(outfile); +} + +void XmaContext::Decode(XMA_CONTEXT_DATA* data) { SCOPE_profile_cpu_f("apu"); // What I see: @@ -345,49 +338,48 @@ void XmaContext::DecodePackets(XMA_CONTEXT_DATA* data) { // to the read offset. uint8_t* output_buffer = memory()->TranslatePhysical(data->output_buffer_ptr); uint32_t output_capacity = - data->output_buffer_block_count * kBytesPerSubframe; + data->output_buffer_block_count * kBytesPerSubframeChannel; uint32_t output_read_offset = - data->output_buffer_read_offset * kBytesPerSubframe; + data->output_buffer_read_offset * kBytesPerSubframeChannel; uint32_t output_write_offset = - data->output_buffer_write_offset * kBytesPerSubframe; + data->output_buffer_write_offset * kBytesPerSubframeChannel; RingBuffer output_rb(output_buffer, output_capacity); output_rb.set_read_offset(output_read_offset); output_rb.set_write_offset(output_write_offset); + int num_channels = data->is_stereo ? 2 : 1; + // We can only decode an entire frame and write it out at a time, so // don't save any samples. + // TODO(JoelLinn): subframes when looping size_t output_remaining_bytes = output_rb.write_count(); - output_remaining_bytes -= data->is_stereo ? (output_remaining_bytes % 2048) - : (output_remaining_bytes % 1024); + output_remaining_bytes -= + output_remaining_bytes % (kBytesPerFrameChannel * num_channels); + // is_dirty_ = true; // TODO + // is_dirty_ = false; // TODO + static int total_samples = 0; // Decode until we can't write any more data. while (output_remaining_bytes > 0) { - int num_channels = data->is_stereo ? 2 : 1; if (!data->input_buffer_0_valid && !data->input_buffer_1_valid) { // Out of data. break; } + assert_true(packets_skip_ == 0); + assert_true(split_frame_len_ == 0); + assert_true(split_frame_len_partial_ == 0); + if (data->input_buffer_read_offset == 0) { // Invalid offset. Go ahead and set it. - uint32_t offset = xma::GetPacketFrameOffset(current_input_buffer); + auto offset = xma::GetPacketFrameOffset(current_input_buffer); if (offset == -1) { // No more frames. - if (data->current_buffer == 0) { - data->input_buffer_0_valid = 0; - data->input_buffer_read_offset = 0; - data->current_buffer++; - } else if (data->current_buffer == 1) { - data->input_buffer_1_valid = 0; - data->input_buffer_read_offset = 0; - data->current_buffer--; - } - - // Die if we have no partial saved. - if (!partial_frame_saved_) { - return; - } + SwapInputBuffer(data); + // TODO partial frames? end? + assert_always("TODO"); + return; } else { data->input_buffer_read_offset = offset; } @@ -397,205 +389,191 @@ void XmaContext::DecodePackets(XMA_CONTEXT_DATA* data) { data->input_buffer_read_offset)) { XELOGAPU("XmaContext {}: Invalid read offset {}!", id(), data->input_buffer_read_offset); - if (data->current_buffer == 0) { - data->current_buffer = 1; - data->input_buffer_0_valid = 0; - } else if (data->current_buffer == 1) { - data->current_buffer = 0; - data->input_buffer_1_valid = 0; - } - - data->input_buffer_read_offset = 0; + SwapInputBuffer(data); return; } - // Check if we need to save a partial frame. - if (data->input_buffer_read_offset != 0 && !partial_frame_saved_ && - GetFramePacketNumber(current_input_buffer, current_input_size, - data->input_buffer_read_offset) == - current_input_packet_count - 1) { - BitStream stream(current_input_buffer, current_input_size * 8); - stream.SetOffset(data->input_buffer_read_offset); + // Where are we in the buffer (in XMA jargon) + auto [packet_idx, frame_idx] = + GetFrameNumber(current_input_buffer, current_input_size, + data->input_buffer_read_offset); + // TODO handle + assert_true(packet_idx >= 0); + assert_true(frame_idx >= 0); + auto packet = current_input_buffer + packet_idx * kBytesPerPacket; + // frames that belong to this packet + auto [frame_count, frame_last_split] = GetPacketFrameCount(packet); + assert_true(frame_count >= 0); // TODO end + // Current frame is split to next packet: + bool frame_is_split = frame_last_split && (frame_idx >= frame_count - 1); - if (stream.BitsRemaining() >= 15) { - uint64_t frame_size = stream.Read(15); - if (data->input_buffer_read_offset + frame_size >= - current_input_size * 8 && - frame_size != 0x7FFF) { - uint32_t rel_offset = data->input_buffer_read_offset % (2048 * 8); + PrepareDecoder(packet, data->sample_rate, num_channels); - // Frame is cut off! Save and exit. - partial_frame_saved_ = true; - partial_frame_size_known_ = true; - partial_frame_total_size_bits_ = frame_size; - SavePartial( - current_input_buffer + (current_input_packet_count - 1) * 2048, - rel_offset, frame_size, false); - } - } else { - // Header cut in half :/ - uint32_t rel_offset = data->input_buffer_read_offset % (2048 * 8); - - partial_frame_saved_ = true; - partial_frame_size_known_ = false; - SavePartial( - current_input_buffer + (current_input_packet_count - 1) * 2048, - rel_offset, 0, false); - } - - if (partial_frame_saved_) { - XELOGAPU("XmaContext {}: saved a partial frame", id()); - - if (data->current_buffer == 0) { - data->input_buffer_0_valid = 0; - data->input_buffer_read_offset = 0; - data->current_buffer++; - } else if (data->current_buffer == 1) { - data->input_buffer_1_valid = 0; - data->input_buffer_read_offset = 0; - data->current_buffer--; - } - - return; - } - } - - if (partial_frame_saved_ && !partial_frame_size_known_) { - // Append the rest of the header. - size_t offset = SavePartial(current_input_buffer, 32, 15, true); - - // Read the frame size. - BitStream stream(partial_frame_buffer_.data(), - 15 + partial_frame_start_offset_bits_); - stream.SetOffset(partial_frame_start_offset_bits_); - - uint64_t size = stream.Read(15); - partial_frame_size_known_ = true; - partial_frame_total_size_bits_ = size; - - // Now append the rest of the frame. - SavePartial(current_input_buffer, 32 + (uint32_t)offset, size, true); - } else if (partial_frame_saved_) { - // Append the rest of the frame. - SavePartial(current_input_buffer, 32, partial_frame_total_size_bits_, - true); - } - - // Prepare the decoder. Reinitialize if any parameters have changed. - PrepareDecoder(current_input_buffer, current_input_size, data->sample_rate, - num_channels); - - bool partial = false; - size_t bit_offset = data->input_buffer_read_offset; - if (partial_frame_saved_) { - XELOGAPU("XmaContext {}: processing saved partial frame", id()); - packet_->data = partial_frame_buffer_.data(); - packet_->size = (int)partial_frame_buffer_.size(); - - bit_offset = partial_frame_start_offset_bits_; - partial = true; - partial_frame_saved_ = false; + BitStream stream(current_input_buffer, (packet_idx + 1) * kBitsPerPacket); + stream.SetOffset(data->input_buffer_read_offset); + int frame_len; + int frame_len_partial = static_cast(stream.BitsRemaining()); + if (frame_len_partial >= 15) { + frame_len = static_cast(stream.Peek(15)); } else { - packet_->data = current_input_buffer; - packet_->size = (int)current_input_size; + // assert_always(); + frame_len = xma::kMaxFrameLength + 1; + } + assert_true(frame_is_split == (frame_len > frame_len_partial)); + + // TODO fix bitstream copy + std::memset(xma_frame_.data(), 0, xma_frame_.size()); + + auto padding_start = stream.Copy(xma_frame_.data() + 1, + std::min(frame_len, frame_len_partial)); + assert_true(padding_start < 8); + + if (frame_is_split) { + // go to next xma packet of this stream + // for (auto skip = xma::GetPacketSkipCount(packet) + 1; skip > 0; skip--) + auto skip = xma::GetPacketSkipCount(packet) + 1; + do { + packet += kBytesPerPacket; + packet_idx++; + if (packet_idx >= current_input_packet_count) { + packets_skip_ = skip; + split_frame_len_ = frame_len; + split_frame_len_partial_ = frame_len_partial; + SwapInputBuffer(data); + return; + } + skip--; + /* + if (skip == 0) { + std::tie(frame_count, frame_last_split) = GetPacketFrameCount(packet); + if (frame_count == 0) { + skip = xma::GetPacketSkipCount(packet) + 1; + } + } + */ + } while (skip > 0); + std::tie(frame_count, frame_last_split) = GetPacketFrameCount(packet); + frame_idx = -1; + + stream = + BitStream(current_input_buffer, (packet_idx + 1) * kBitsPerPacket); + stream.SetOffset(packet_idx * kBitsPerPacket + 32); + + if (frame_len > xma::kMaxFrameLength) { + // TODO write CopyPeekMethod + auto offset = stream.offset_bits(); + stream.Copy( + xma_frame_.data() + 1 + ((frame_len_partial + padding_start) / 8), + 15 - frame_len_partial); + stream.SetOffset(offset); + BitStream slen(xma_frame_.data() + 1, 15 + padding_start); + slen.Advance(padding_start); + frame_len = static_cast(slen.Read(15)); + } + + if (frame_count > 0) { + assert_true(xma::GetPacketFrameOffset(packet) - 32 == + frame_len - frame_len_partial); + } + + auto offset = stream.Copy( + xma_frame_.data() + 1 + ((frame_len_partial + padding_start) / 8), + frame_len - frame_len_partial); + assert_true(offset == (padding_start + frame_len_partial) % 8); } - int invalid_frame = 0; // invalid frame? - int got_frame = 0; // successfully decoded a frame? - int frame_size = 0; - int len = - xma2_decode_frame(context_, packet_, decoded_frame_, &got_frame, - &invalid_frame, &frame_size, !partial, bit_offset); - if (!partial && len == 0) { - // Got the last frame of a packet. Advance the read offset to the next - // packet. - uint32_t packet_number = - GetFramePacketNumber(current_input_buffer, current_input_size, - data->input_buffer_read_offset); - if (packet_number == current_input_packet_count - 1) { - // Last packet. - if (data->current_buffer == 0) { - data->input_buffer_0_valid = 0; - data->input_buffer_read_offset = 0; - data->current_buffer = 1; - } else if (data->current_buffer == 1) { - data->input_buffer_1_valid = 0; - data->input_buffer_read_offset = 0; - data->current_buffer = 0; - } - } else { - // Advance the read offset. - packet_number++; - uint8_t* packet = current_input_buffer + (packet_number * 2048); - uint32_t first_frame_offset = xma::GetPacketFrameOffset(packet); - if (first_frame_offset == -1) { - // Invalid packet (only contained a frame partial). Out of input. + av_packet_->data = xma_frame_.data(); + av_packet_->size = + static_cast(1 + ((padding_start + frame_len) / 8) + + (((padding_start + frame_len) % 8) ? 1 : 0)); + + auto padding_end = av_packet_->size * 8 - (8 + padding_start + frame_len); + assert_true(padding_end < 8); + xma_frame_[0] = ((padding_start & 7) << 5) | ((padding_end & 7) << 2); + + auto ret = avcodec_send_packet(av_context_, av_packet_); + if (ret < 0) { + XELOGE("XmaContext {}: Error sending packet for decoding", id()); + // TODO bail out + assert_always(); + } + + ret = avcodec_receive_frame(av_context_, av_frame_); + /* + if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) + // TODO AVERROR_EOF??? + break; + else + */ + if (ret < 0) { + XELOGE("XmaContext {}: Error during decoding", id()); + assert_always(); + return; // TODO bail out + } + assert_true(ret == 0); + + { + // copy over 1 frame + // update input buffer read offset + + // assert(decoded_consumed_samples_ + kSamplesPerFrame <= + // current_frame_.size()); + assert_true(av_context_->sample_fmt == AV_SAMPLE_FMT_FLTP); + // assert_true(frame_is_split == (frame_idx == -1)); + + // dump_raw(av_frame_, id()); + ConvertFrame((const uint8_t**)av_frame_->data, num_channels, + kSamplesPerFrame, raw_frame_.data()); + // decoded_consumed_samples_ += kSamplesPerFrame; + + auto byte_count = kBytesPerFrameChannel * num_channels; + assert_true(output_remaining_bytes >= byte_count); + output_rb.Write(raw_frame_.data(), byte_count); + output_remaining_bytes -= byte_count; + data->output_buffer_write_offset = output_rb.write_offset() / 256; + + total_samples += id_ == 0 ? kSamplesPerFrame : 0; + + size_t offset = data->input_buffer_read_offset; + // if (offset % (kBytesPerSample * 8) == 0) { + // offset = xma::GetPacketFrameOffset(packet); + // } + offset = GetNextFrame(current_input_buffer, current_input_size, offset); + // assert_true((offset == 0) == + // (frame_is_split || (frame_idx + 1 >= frame_count))); + if (frame_idx + 1 >= frame_count) { + // Next packet + auto skip = xma::GetPacketSkipCount(packet) + 1; + packet += skip * kBytesPerPacket; + packet_idx += skip; + // Next packet + if (packet_idx >= current_input_packet_count) { + // Buffer is fully used if (data->current_buffer == 0) { data->input_buffer_0_valid = 0; - data->current_buffer = 1; - } else if (data->current_buffer == 1) { + } else { data->input_buffer_1_valid = 0; - data->current_buffer = 0; } - + data->current_buffer ^= 1; data->input_buffer_read_offset = 0; - } else { - data->input_buffer_read_offset = - packet_number * 2048 * 8 + first_frame_offset; + break; } + // offset = packet_idx * kBitsPerPacket; + offset = + xma::GetPacketFrameOffset(packet) + packet_idx * kBitsPerPacket; } - } - - if (got_frame) { - // Valid frame. - // Check and see if we need to loop back to any spot. - if (data->loop_count > 0 && - data->input_buffer_read_offset == data->loop_end) { - // Loop back to the beginning. - data->input_buffer_read_offset = data->loop_start; - if (data->loop_count < 255) { - data->loop_count--; + if (offset == 0) { + // Next packet + if (packet_idx >= current_input_packet_count) { + // Buffer is fully used + SwapInputBuffer(data); + break; } - } else if (!partial && len > 0) { - data->input_buffer_read_offset += len; + offset = + xma::GetPacketFrameOffset(packet) + packet_idx * kBitsPerPacket; } - } else if (len < 0) { - // Did not get frame - XELOGAPU("FFmpeg failed to decode a frame!"); - if (frame_size && frame_size != 0x7FFF) { - data->input_buffer_read_offset += frame_size; - } else { - data->input_buffer_0_valid = 0; - data->input_buffer_1_valid = 0; - } - return; - } - - if (got_frame) { - // Successfully decoded a frame. - // Copy to the output buffer. - size_t written_bytes = 0; - - // Validity checks. - assert(decoded_frame_->nb_samples <= kSamplesPerFrame); - assert(context_->sample_fmt == AV_SAMPLE_FMT_FLTP); - - // Check the returned buffer size. - assert(av_samples_get_buffer_size(NULL, context_->channels, - decoded_frame_->nb_samples, - context_->sample_fmt, 1) == - context_->channels * decoded_frame_->nb_samples * sizeof(float)); - - // Convert the frame. - ConvertFrame((const uint8_t**)decoded_frame_->data, context_->channels, - decoded_frame_->nb_samples, current_frame_); - - assert_true(output_remaining_bytes >= kBytesPerFrame * num_channels); - output_rb.Write(current_frame_, kBytesPerFrame * num_channels); - written_bytes = kBytesPerFrame * num_channels; - - output_remaining_bytes -= written_bytes; - data->output_buffer_write_offset = output_rb.write_offset() / 256; + // TODO buffer bounds check + data->input_buffer_read_offset = offset; } } @@ -606,8 +584,51 @@ void XmaContext::DecodePackets(XMA_CONTEXT_DATA* data) { } } -uint32_t XmaContext::GetFramePacketNumber(uint8_t* block, size_t size, - size_t bit_offset) { +size_t XmaContext::GetNextFrame(uint8_t* block, size_t size, + size_t bit_offset) { + // offset = xma::GetPacketFrameOffset(packet); + // TODO meh + // auto next_packet = bit_offset - bit_offset % kBitsPerPacket + + // kBitsPerPacket; + auto packet_idx = GetFramePacketNumber(block, size, bit_offset); + + BitStream stream(block, size * 8); + stream.SetOffset(bit_offset); + + if (stream.BitsRemaining() < 15) { + return 0; + } + + uint64_t len = stream.Read(15); + if ((len - 15) > stream.BitsRemaining()) { + assert_always("TODO"); + // *bit_offset = next_packet; + // return false; + // return next_packet; + return 0; + } else if (len == 0x7FFF) { + assert_always("TODO"); + // *bit_offset = next_packet; + // return false; + return 0; + // return next_packet; + } + + stream.Advance(len - (15 + 1)); + // Read the trailing bit to see if frames follow + if (stream.Read(1) == 0) { + return 0; + } + + bit_offset += len; + if (packet_idx < GetFramePacketNumber(block, size, bit_offset)) { + return 0; + } + return bit_offset; +} + +int XmaContext::GetFramePacketNumber(uint8_t* block, size_t size, + size_t bit_offset) { size *= 8; if (bit_offset >= size) { // Not good :( @@ -621,32 +642,104 @@ uint32_t XmaContext::GetFramePacketNumber(uint8_t* block, size_t size, return (uint32_t)packet_number; } -int XmaContext::PrepareDecoder(uint8_t* block, size_t size, int sample_rate, - int channels) { +std::tuple XmaContext::GetFrameNumber(uint8_t* block, size_t size, + size_t bit_offset) { + auto packet_idx = GetFramePacketNumber(block, size, bit_offset); + + if (packet_idx < 0 || (packet_idx + 1) * kBytesPerPacket > size) { + return {packet_idx, -1}; + } + + uint8_t* packet = block + (packet_idx * kBytesPerPacket); + auto first_frame_offset = xma::GetPacketFrameOffset(packet); + BitStream stream(block, size * 8); + stream.SetOffset(packet_idx * kBitsPerPacket + first_frame_offset); + + int frame_idx = 0; + while (true) { + if (stream.BitsRemaining() < 15) { + return {packet_idx, -1}; + } + + if (stream.offset_bits() == bit_offset) { + break; + } + + uint64_t size = stream.Read(15); + if ((size - 15) > stream.BitsRemaining()) { + // Last frame. + break; + } else if (size == 0x7FFF) { + // Invalid frame (and last of this packet) + break; + } + + stream.Advance(size - (15 + 1)); + + // Read the trailing bit to see if frames follow + if (stream.Read(1) == 0) { + break; + } + frame_idx++; + } + return {packet_idx, frame_idx}; +} + +std::tuple XmaContext::GetPacketFrameCount(uint8_t* packet) { + auto first_frame_offset = xma::GetPacketFrameOffset(packet); + if (first_frame_offset > kBitsPerPacket - kBitsPerHeader) { + // frame offset is beyond packet end + return {0, false}; + } + + BitStream stream(packet, kBitsPerPacket); + stream.SetOffset(first_frame_offset); + int frame_count = 0; + + while (true) { + frame_count++; + if (stream.BitsRemaining() < 15) { + return {frame_count, true}; + } + + uint64_t size = stream.Read(15); + if ((size - 15) > stream.BitsRemaining()) { + return {frame_count, true}; + } else if (size == 0x7FFF) { + assert_always(); + return {frame_count, true}; + } + + stream.Advance(size - (15 + 1)); + + if (stream.Read(1) == 0) { + return {frame_count, false}; + } + } +} + +int XmaContext::PrepareDecoder(uint8_t* packet, int sample_rate, int channels) { // Sanity check: Packet metadata is always 1 for XMA2/0 for XMA - assert_true((block[2] & 0x7) == 1 || (block[2] & 0x7) == 0); + assert_true((packet[2] & 0x7) == 1 || (packet[2] & 0x7) == 0); sample_rate = GetSampleRate(sample_rate); // Re-initialize the context with new sample rate and channels. - if (context_->sample_rate != sample_rate || context_->channels != channels) { + if (av_context_->sample_rate != sample_rate || + av_context_->channels != channels) { // We have to reopen the codec so it'll realloc whatever data it needs. // TODO(DrChat): Find a better way. - avcodec_close(context_); + avcodec_close(av_context_); - context_->sample_rate = sample_rate; - context_->channels = channels; - extra_data_.channel_mask = - channels == 2 ? AV_CH_LAYOUT_STEREO : AV_CH_LAYOUT_MONO; + av_context_->sample_rate = sample_rate; + av_context_->channels = channels; - if (avcodec_open2(context_, codec_, NULL) < 0) { + if (avcodec_open2(av_context_, av_codec_, NULL) < 0) { XELOGE("XmaContext: Failed to reopen FFmpeg context"); - return 1; + return -1; } + return 1; } - - av_frame_unref(decoded_frame_); - return 0; } diff --git a/src/xenia/apu/xma_context.h b/src/xenia/apu/xma_context.h index d800bc0a6..114a8c388 100644 --- a/src/xenia/apu/xma_context.h +++ b/src/xenia/apu/xma_context.h @@ -2,7 +2,7 @@ ****************************************************************************** * Xenia : Xbox 360 Emulator Research Project * ****************************************************************************** - * Copyright 2015 Ben Vanik. All rights reserved. * + * Copyright 2021 Ben Vanik. All rights reserved. * * Released under the BSD license - see LICENSE in the root for more details. * ****************************************************************************** */ @@ -10,10 +10,11 @@ #ifndef XENIA_APU_XMA_CONTEXT_H_ #define XENIA_APU_XMA_CONTEXT_H_ +#include #include #include #include -#include +//#include #include "xenia/memory.h" #include "xenia/xbox.h" @@ -30,6 +31,7 @@ // Forward declarations struct AVCodec; +struct AVCodecParserContext; struct AVCodecContext; struct AVFrame; struct AVPacket; @@ -121,29 +123,29 @@ struct XMA_CONTEXT_DATA { static_assert_size(XMA_CONTEXT_DATA, 64); #pragma pack(push, 1) -struct WmaProExtraData { - uint16_t bits_per_sample; - uint32_t channel_mask; - uint8_t unk06[8]; - uint16_t decode_flags; - uint8_t unk10[2]; +// XMA2WAVEFORMATEX +struct Xma2ExtraData { + uint8_t raw[34]; }; -static_assert_size(WmaProExtraData, 18); +static_assert_size(Xma2ExtraData, 34); #pragma pack(pop) class XmaContext { public: static const uint32_t kBytesPerPacket = 2048; + static const uint32_t kBitsPerPacket = kBytesPerPacket * 8; + static const uint32_t kBitsPerHeader = 33; static const uint32_t kBytesPerSample = 2; static const uint32_t kSamplesPerFrame = 512; static const uint32_t kSamplesPerSubframe = 128; - static const uint32_t kBytesPerFrame = kSamplesPerFrame * kBytesPerSample; - static const uint32_t kBytesPerSubframe = + static const uint32_t kBytesPerFrameChannel = + kSamplesPerFrame * kBytesPerSample; + static const uint32_t kBytesPerSubframeChannel = kSamplesPerSubframe * kBytesPerSample; - static const uint32_t kOutputBytesPerBlock = 256; - static const uint32_t kOutputMaxSizeBytes = 31 * kOutputBytesPerBlock; + // static const uint32_t kOutputBytesPerBlock = 256; + // static const uint32_t kOutputMaxSizeBytes = 31 * kOutputBytesPerBlock; explicit XmaContext(); ~XmaContext(); @@ -168,28 +170,29 @@ class XmaContext { void set_is_enabled(bool is_enabled) { is_enabled_ = is_enabled; } private: + static void SwapInputBuffer(XMA_CONTEXT_DATA* data); + static void NextPacket(XMA_CONTEXT_DATA* data); static int GetSampleRate(int id); + // Get the offset of the next frame. Does not traverse packets. + static size_t GetNextFrame(uint8_t* block, size_t size, size_t bit_offset); + // Get the containing packet number of the frame pointed to by the offset. + static int GetFramePacketNumber(uint8_t* block, size_t size, + size_t bit_offset); + // Get the packet number and the index of the frame inside that packet + static std::tuple GetFrameNumber(uint8_t* block, size_t size, + size_t bit_offset); + // Get the number of frames contained in the packet (including truncated) and + // if the last frame is split. + static std::tuple GetPacketFrameCount(uint8_t* packet); + + // Convert sample format and swap bytes + static bool ConvertFrame(const uint8_t** samples, int num_channels, + int num_samples, uint8_t* output_buffer); - size_t SavePartial(uint8_t* packet, uint32_t frame_offset_bits, - size_t frame_size_bits, bool append); bool ValidFrameOffset(uint8_t* block, size_t size_bytes, size_t frame_offset_bits); - void DecodePackets(XMA_CONTEXT_DATA* data); - uint32_t GetFramePacketNumber(uint8_t* block, size_t size, size_t bit_offset); - int PrepareDecoder(uint8_t* block, size_t size, int sample_rate, - int channels); - - bool ConvertFrame(const uint8_t** samples, int num_channels, int num_samples, - uint8_t* output_buffer); - - int StartPacket(XMA_CONTEXT_DATA* data); - - int PreparePacket(uint8_t* input, size_t seq_offset, size_t size, - int sample_rate, int channels); - void DiscardPacket(); - - int DecodePacket(uint8_t* output, size_t offset, size_t size, - size_t* read_bytes); + void Decode(XMA_CONTEXT_DATA* data); + int PrepareDecoder(uint8_t* packet, int sample_rate, int channels); Memory* memory_ = nullptr; @@ -198,22 +201,34 @@ class XmaContext { std::mutex lock_; bool is_allocated_ = false; bool is_enabled_ = false; + // bool is_dirty_ = true; - // libav structures - AVCodec* codec_ = nullptr; - AVCodecContext* context_ = nullptr; - AVFrame* decoded_frame_ = nullptr; - AVPacket* packet_ = nullptr; - WmaProExtraData extra_data_; + // ffmpeg structures + AVPacket* av_packet_ = nullptr; + AVCodec* av_codec_ = nullptr; + AVCodecContext* av_context_ = nullptr; + AVFrame* av_frame_ = nullptr; + // uint32_t decoded_consumed_samples_ = 0; // TODO do this dynamically + // int decoded_idx_ = -1; - bool partial_frame_saved_ = false; - bool partial_frame_size_known_ = false; - size_t partial_frame_total_size_bits_ = 0; - size_t partial_frame_start_offset_bits_ = 0; - size_t partial_frame_offset_bits_ = 0; // blah internal don't use this - std::vector partial_frame_buffer_; + // bool partial_frame_saved_ = false; + // bool partial_frame_size_known_ = false; + // size_t partial_frame_total_size_bits_ = 0; + // size_t partial_frame_start_offset_bits_ = 0; + // size_t partial_frame_offset_bits_ = 0; // blah internal don't use this + // std::vector partial_frame_buffer_; + uint32_t packets_skip_ = 0; - uint8_t* current_frame_ = nullptr; + // bool split_frame_pending_ = false; + uint32_t split_frame_len_ = 0; + uint32_t split_frame_len_partial_ = 0; + // first byte contains bit offset information + std::array xma_frame_; + + // uint8_t* current_frame_ = nullptr; + // conversion buffer for 2 channel frame + std::array raw_frame_; + // std::vector current_frame_ = std::vector(0); }; } // namespace apu diff --git a/src/xenia/apu/xma_helpers.h b/src/xenia/apu/xma_helpers.h index c22c70c25..593d2d071 100644 --- a/src/xenia/apu/xma_helpers.h +++ b/src/xenia/apu/xma_helpers.h @@ -2,7 +2,7 @@ ****************************************************************************** * Xenia : Xbox 360 Emulator Research Project * ****************************************************************************** - * Copyright 2015 Ben Vanik. All rights reserved. * + * Copyright 2021 Ben Vanik. All rights reserved. * * Released under the BSD license - see LICENSE in the root for more details. * ****************************************************************************** */ @@ -18,6 +18,8 @@ namespace xe { namespace apu { namespace xma { +static const uint32_t kMaxFrameLength = 0x7FFF; + // Get number of frames that /begin/ in this packet. uint32_t GetPacketFrameCount(uint8_t* packet) { return (uint8_t)(packet[0] >> 2); @@ -27,11 +29,12 @@ uint32_t GetPacketFrameCount(uint8_t* packet) { uint32_t GetPacketFrameOffset(uint8_t* packet) { uint32_t val = (uint16_t)(((packet[0] & 0x3) << 13) | (packet[1] << 5) | (packet[2] >> 3)); - if (val == 0x7FFF) { - return -1; - } else { - return val + 32; - } + // if (val > kBitsPerPacket - kBitsPerHeader) { + // // There is no data in this packet + // return -1; + // } else { + return val + 32; + // } } uint32_t GetPacketMetadata(uint8_t* packet) {