Add comments explaining how the voice processing works

2012-11-15 16:57:33 +01:00 · 2012-11-15 16:57:33 +01:00 · 5a2d8661d7
parent aa90f799b7
commit 5a2d8661d7
1 changed files with 53 additions and 6 deletions
--- a/Source/Core/Core/Src/HW/DSPHLE/UCodes/UCode_NewAX_Voice.h
+++ b/Source/Core/Core/Src/HW/DSPHLE/UCodes/UCode_NewAX_Voice.h
@ -89,7 +89,9 @@ inline void AcceleratorSetup(AXPB* pb, u32* cur_addr)
 	acc_cur_addr = cur_addr;
 }
-// Reads a sample from the simulated accelerator.
+// Reads a sample from the simulated accelerator. Also handles looping and
 // disabling streams that reached the end (this is done by an exception raised
 // by the accelerator on real hardware).
 inline u16 AcceleratorGetSample()
 {
 	u16 ret;
@ -98,6 +100,7 @@ inline u16 AcceleratorGetSample()
 	{
 		case 0x00:	// ADPCM
 		{
 			// ADPCM decoding, not much to explain here.
 			if ((*acc_cur_addr & 15) == 0)
 			{
 				acc_pb->adpcm.pred_scale = DSP::ReadARAM((*acc_cur_addr & ~15) >> 1);
@ -148,14 +151,24 @@ inline u16 AcceleratorGetSample()
 			return 0;
 	}
 	// Have we reached the end address?
 	//
 	// On real hardware, this would raise an interrupt that is handled by the
 	// UCode. We simulate what this interrupt does here.
 	if (*acc_cur_addr >= acc_end_addr)
 	{
 		// If we are really at the end (and we don't simply have cur_addr >
 		// end_addr all the time), loop back to loop_addr.
 		if ((*acc_cur_addr & ~0x1F) == (acc_end_addr & ~0x1F))
 			*acc_cur_addr = acc_loop_addr;
 		// Simulate an ACC overflow interrupt.
 		if (acc_pb->audio_addr.looping)
 		{
 			// Set the ADPCM infos to continue processing at loop_addr.
 			//
 			// For some reason, yn1 and yn2 aren't set if the voice is not of
 			// stream type. This is what the AX UCode does and I don't really
 			// know why.
 			acc_pb->adpcm.pred_scale = acc_pb->adpcm_loop_info.pred_scale;
 			if (!acc_pb->is_stream)
 			{
@ -165,6 +178,7 @@ inline u16 AcceleratorGetSample()
 		}
 		else
 		{
 			// Non looping voice reached the end -> running = 0.
 			acc_pb->running = 0;
 		}
 	}
@ -181,12 +195,31 @@ inline void GetInputSamples(AXPB& pb, s16* samples)
 	// TODO: support polyphase interpolation if coefficients are available.
 	if (pb.src_type == SRCTYPE_POLYPHASE || pb.src_type == SRCTYPE_LINEAR)
 	{
 		// Convert the input to a higher or lower sample rate using a linear
 		// interpolation algorithm. The input to output ratio is set in
 		// pb.src.ratio, which is a floating point num stored as a 32b integer:
 		//  * Upper 16 bits of the ratio are the integer part
 		//  * Lower 16 bits are the decimal part
 		u32 ratio = HILO_TO_32(pb.src.ratio);
 		// We start getting samples not from sample 0, but 0.<cur_addr_frac>.
 		// This avoids discontinuties in the audio stream, especially with very
 		// low ratios which interpolate a lot of values between two "real"
 		// samples.
 		u32 curr_pos = pb.src.cur_addr_frac;
 		u32 real_samples_needed = (32 * ratio + curr_pos) >> 16;
 		s16 real_samples[130];		// Max supported ratio is 4
 		// Compute the number of real samples we will need to read from the
 		// data source. We need to output 32 samples, so we need to read
 		// 32 * ratio + curr_pos samples. The maximum possible ratio available
 		// on the DSP is 4.0, so at most we will read 128 real samples.
 		s16 real_samples[130];
 		u32 real_samples_needed = (32 * ratio + curr_pos) >> 16;
 		// The first two real samples are the ones we read at the previous
 		// iteration. That way we can interpolate before having read 2 new
 		// samples from the accelerator.
 		//
 		// The next real samples are read from the accelerator.
 		real_samples[0] = pb.src.last_samples[2];
 		real_samples[1] = pb.src.last_samples[3];
 		for (u32 i = 0; i < real_samples_needed; ++i)
@ -194,17 +227,24 @@ inline void GetInputSamples(AXPB& pb, s16* samples)
 		for (u32 i = 0; i < 32; ++i)
 		{
 			// Get our current integer and fractional position. The integer
 			// position is used to get the two samples around us. The
 			// fractional position is used to compute the linear interpolation
 			// between these two samples.
 			u32 curr_int_pos = (curr_pos >> 16);
 			s32 curr_frac_pos = curr_pos & 0xFFFF;
 			s16 samp1 = real_samples[curr_int_pos];
 			s16 samp2 = real_samples[curr_int_pos + 1];
 			// Linear interpolation: s1 + (s2 - s1) * pos
 			s16 sample = samp1 + (s16)(((samp2 - samp1) * (s32)curr_frac_pos) >> 16);
 			samples[i] = sample;
 			curr_pos += ratio;
 		}
 		// Update the last_samples array. A bit tricky because we can't know
 		// for sure we have more than 4 real samples in our array.
 		if (real_samples_needed >= 2)
 			memcpy(pb.src.last_samples, &real_samples[real_samples_needed + 2 - 4], 4 * sizeof (u16));
 		else
@ -216,21 +256,28 @@ inline void GetInputSamples(AXPB& pb, s16* samples)
 	}
 	else // SRCTYPE_NEAREST
 	{
 		// No sample rate conversion here: simply read 32 samples from the
 		// accelerator to the output buffer.
 		for (u32 i = 0; i < 32; ++i)
 			samples[i] = AcceleratorGetSample();
 		memcpy(pb.src.last_samples, samples + 28, 4 * sizeof (u16));
 	}
 	// Update current position in the PB.
 	pb.audio_addr.cur_addr_hi = (u16)(cur_addr >> 16);
 	pb.audio_addr.cur_addr_lo = (u16)(cur_addr & 0xFFFF);
 }
-// Mix samples to an output buffer, with optional volume ramping.
+// Add samples to an output buffer, with optional volume ramping.
 inline void MixAdd(int* out, const s16* input, u16* pvol, bool ramp)
 {
 	u16& volume = pvol[0];
 	u16 volume_delta = pvol[1];
 	// If volume ramping is disabled, set volume_delta to 0. That way, the
 	// mixing loop can avoid testing if volume ramping is enabled at each step,
 	// and just add volume_delta.
 	if (!ramp)
 		volume_delta = 0;
@ -242,7 +289,7 @@ inline void MixAdd(int* out, const s16* input, u16* pvol, bool ramp)
 	}
 }
-// Process 1ms of audio from a PB and mix it to the buffers.
+// Process 1ms of audio (32 samples) from a PB and mix it to the buffers.
 inline void Process1ms(AXPB& pb, const AXBuffers& buffers)
 {
 	// If the voice is not running, nothing to do.