pcsx2/pcsx2/Mdec.cpp

509 lines
11 KiB
C++

// SPDX-FileCopyrightText: 2002-2023 PCSX2 Dev Team
// SPDX-License-Identifier: GPL-2.0+
/* This code was based on the FPSE v0.08 Mdec decoder*/
#include <stdio.h>
#include <string.h>
#include "Common.h"
#include "Mdec.h"
#include "IopHw.h"
struct
{
u32 command;
u32 status;
u16* rl;
int rlsize;
} mdec;
struct config_mdec
{
u32 Mdec;
};
struct config_mdec Config;
u32 mdecArr2[0x100000] = {0};
u32 mdecMem[0x100000]; //watherver large size. //Memory only used to get DMA data and not really for anything else.
//Sould be optimized(the funcs. that use it) to read IOP RAM direcly.
#define PSXM(x) ((uptr)mdecMem + x)
int iq_y[DCTSIZE2], iq_uv[DCTSIZE2];
static void idct1(int* block)
{
const int val = RANGE(DESCALE(block[0], PASS1_BITS + 3));
for (int i = 0; i < DCTSIZE2; i++)
block[i] = val;
}
void idct(int* block, int k)
{
int tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
int z5, z10, z11, z12, z13;
int* ptr;
if (!k)
{
idct1(block);
return;
}
ptr = block;
for (int i = 0; i < DCTSIZE; i++, ptr++)
{
if ((ptr[DCTSIZE * 1] | ptr[DCTSIZE * 2] | ptr[DCTSIZE * 3] |
ptr[DCTSIZE * 4] | ptr[DCTSIZE * 5] | ptr[DCTSIZE * 6] |
ptr[DCTSIZE * 7]) == 0)
{
ptr[DCTSIZE * 0] =
ptr[DCTSIZE * 1] =
ptr[DCTSIZE * 2] =
ptr[DCTSIZE * 3] =
ptr[DCTSIZE * 4] =
ptr[DCTSIZE * 5] =
ptr[DCTSIZE * 6] =
ptr[DCTSIZE * 7] =
ptr[DCTSIZE * 0];
continue;
}
z10 = ptr[DCTSIZE * 0] + ptr[DCTSIZE * 4];
z11 = ptr[DCTSIZE * 0] - ptr[DCTSIZE * 4];
z13 = ptr[DCTSIZE * 2] + ptr[DCTSIZE * 6];
z12 = MULTIPLY(ptr[DCTSIZE * 2] - ptr[DCTSIZE * 6], FIX_1_414213562) - z13;
tmp0 = z10 + z13;
tmp3 = z10 - z13;
tmp1 = z11 + z12;
tmp2 = z11 - z12;
z13 = ptr[DCTSIZE * 3] + ptr[DCTSIZE * 5];
z10 = ptr[DCTSIZE * 3] - ptr[DCTSIZE * 5];
z11 = ptr[DCTSIZE * 1] + ptr[DCTSIZE * 7];
z12 = ptr[DCTSIZE * 1] - ptr[DCTSIZE * 7];
z5 = MULTIPLY(z12 - z10, FIX_1_847759065);
tmp7 = z11 + z13;
tmp6 = MULTIPLY(z10, FIX_2_613125930) + z5 - tmp7;
tmp5 = MULTIPLY(z11 - z13, FIX_1_414213562) - tmp6;
tmp4 = MULTIPLY(z12, FIX_1_082392200) - z5 + tmp5;
ptr[DCTSIZE * 0] = (tmp0 + tmp7);
ptr[DCTSIZE * 7] = (tmp0 - tmp7);
ptr[DCTSIZE * 1] = (tmp1 + tmp6);
ptr[DCTSIZE * 6] = (tmp1 - tmp6);
ptr[DCTSIZE * 2] = (tmp2 + tmp5);
ptr[DCTSIZE * 5] = (tmp2 - tmp5);
ptr[DCTSIZE * 4] = (tmp3 + tmp4);
ptr[DCTSIZE * 3] = (tmp3 - tmp4);
}
ptr = block;
for (int i = 0; i < DCTSIZE; i++, ptr += DCTSIZE)
{
if ((ptr[1] | ptr[2] | ptr[3] | ptr[4] | ptr[5] | ptr[6] |
ptr[7]) == 0)
{
ptr[0] =
ptr[1] =
ptr[2] =
ptr[3] =
ptr[4] =
ptr[5] =
ptr[6] =
ptr[7] =
RANGE(DESCALE(ptr[0], PASS1_BITS + 3));
;
continue;
}
z10 = ptr[0] + ptr[4];
z11 = ptr[0] - ptr[4];
z13 = ptr[2] + ptr[6];
z12 = MULTIPLY(ptr[2] - ptr[6], FIX_1_414213562) - z13;
tmp0 = z10 + z13;
tmp3 = z10 - z13;
tmp1 = z11 + z12;
tmp2 = z11 - z12;
z13 = ptr[3] + ptr[5];
z10 = ptr[3] - ptr[5];
z11 = ptr[1] + ptr[7];
z12 = ptr[1] - ptr[7];
z5 = MULTIPLY(z12 - z10, FIX_1_847759065);
tmp7 = z11 + z13;
tmp6 = MULTIPLY(z10, FIX_2_613125930) + z5 - tmp7;
tmp5 = MULTIPLY(z11 - z13, FIX_1_414213562) - tmp6;
tmp4 = MULTIPLY(z12, FIX_1_082392200) - z5 + tmp5;
ptr[0] = RANGE(DESCALE(tmp0 + tmp7, PASS1_BITS + 3));
;
ptr[7] = RANGE(DESCALE(tmp0 - tmp7, PASS1_BITS + 3));
;
ptr[1] = RANGE(DESCALE(tmp1 + tmp6, PASS1_BITS + 3));
;
ptr[6] = RANGE(DESCALE(tmp1 - tmp6, PASS1_BITS + 3));
;
ptr[2] = RANGE(DESCALE(tmp2 + tmp5, PASS1_BITS + 3));
;
ptr[5] = RANGE(DESCALE(tmp2 - tmp5, PASS1_BITS + 3));
;
ptr[4] = RANGE(DESCALE(tmp3 + tmp4, PASS1_BITS + 3));
;
ptr[3] = RANGE(DESCALE(tmp3 - tmp4, PASS1_BITS + 3));
;
}
}
void mdecInit(void)
{
Config.Mdec = 0; //XXXXXXXXXXXXXXXXX 0 or 1 // 1 is black and white decoding
mdec.rl = (u16*)PSXM(0);
//mdec.rl = (u16*)&psxM[0x100000];
mdec.command = 0;
mdec.status = 0;
round_init();
}
void mdecWrite0(u32 data)
{
MDEC_LOG("mdec0 write %lx", data);
mdec.command = data;
if ((data & 0xf5ff0000) == 0x30000000)
{
mdec.rlsize = data & 0xffff;
}
}
void mdecWrite1(u32 data)
{
MDEC_LOG("mdec1 write %lx", data);
if (data & 0x80000000)
{
// mdec reset
round_init();
// mdecInit();
}
}
u32 mdecRead0(void)
{
MDEC_LOG("mdec0 read %lx", mdec.command);
return mdec.command;
}
u32 mdecRead1(void)
{
MDEC_LOG("mdec1 read %lx", mdec.status);
return mdec.status;
}
void psxDma0(u32 adr, u32 bcr, u32 chcr)
{
const int cmd = mdec.command;
MDEC_LOG("DMA0 %lx %lx %lx", adr, bcr, chcr);
if (chcr != 0x01000201)
return;
// bcr LSBs are the blocksize in words
// bcr MSBs are the number of block
const int size = (bcr >> 16) * (bcr & 0xffff);
if (size < 0)
{
// Need to investigate what happen if the transfer is huge
Console.Error("psxDma0 DMA transfer overflow !");
return;
}
for (int i = 0; i < (size); i++)
{
*(u32*)PSXM(((i + 0) * 4)) = iopMemRead32(adr + ((i + 0) * 4));
if (i < 20)
MDEC_LOG(" data %08X %08X ", iopMemRead32((adr & 0x00FFFFFF) + (i * 4)), *(u32*)PSXM((i * 4)));
}
if (cmd == 0x40000001)
{
u8* p = (u8*)PSXM(0); //u8 *p = (u8*)PSXM(adr);
iqtab_init(iq_y, p);
iqtab_init(iq_uv, p + 64);
}
else if ((cmd & 0xf5ff0000) == 0x30000000)
{
mdec.rl = (u16*)PSXM(0); //mdec.rl = (u16*)PSXM(adr);
}
HW_DMA0_CHCR &= ~0x01000000;
psxDmaInterrupt(0);
}
void psxDma1(u32 adr, u32 bcr, u32 chcr)
{
int blk[DCTSIZE2 * 6];
unsigned short* image;
MDEC_LOG("DMA1 %lx %lx %lx (cmd = %lx)", adr, bcr, chcr, mdec.command);
if (chcr != 0x01000200)
return;
// bcr LSBs are the blocksize in words
// bcr MSBs are the number of block
int size = (bcr >> 16) * (bcr & 0xffff);
const int size2 = (bcr >> 16) * (bcr & 0xffff);
if (size < 0)
{
// Need to investigate what happen if the transfer is huge
Console.Error("psxDma1 DMA transfer overflow !");
return;
}
image = (u16*)mdecArr2; //(u16*)PSXM(0); //image = (u16*)PSXM(adr);
if (mdec.command & 0x08000000)
{
for (; size > 0; size -= (16 * 16) / 2, image += (16 * 16))
{
mdec.rl = rl2blk(blk, mdec.rl);
yuv2rgb15(blk, image);
}
}
else
{
for (; size > 0; size -= (24 * 16) / 2, image += (24 * 16))
{
mdec.rl = rl2blk(blk, mdec.rl);
yuv2rgb24(blk, (u8*)image);
}
}
for (int i = 0; i < (size2); i++)
{
iopMemWrite32(((adr & 0x00FFFFFF) + (i * 4) + 0), mdecArr2[i]);
if (i < 20)
MDEC_LOG(" data %08X %08X ", iopMemRead32((adr & 0x00FFFFFF) + (i * 4)), mdecArr2[i]);
}
HW_DMA1_CHCR &= ~0x01000000;
psxDmaInterrupt(1);
}
static int zscan[DCTSIZE2] = {
0, 1, 8, 16, 9, 2, 3, 10,
17, 24, 32, 25, 18, 11, 4, 5,
12, 19, 26, 33, 40, 48, 41, 34,
27, 20, 13, 6, 7, 14, 21, 28,
35, 42, 49, 56, 57, 50, 43, 36,
29, 22, 15, 23, 30, 37, 44, 51,
58, 59, 52, 45, 38, 31, 39, 46,
53, 60, 61, 54, 47, 55, 62, 63};
static int aanscales[DCTSIZE2] = {
16384, 22725, 21407, 19266, 16384, 12873, 8867, 4520,
22725, 31521, 29692, 26722, 22725, 17855, 12299, 6270,
21407, 29692, 27969, 25172, 21407, 16819, 11585, 5906,
19266, 26722, 25172, 22654, 19266, 15137, 10426, 5315,
16384, 22725, 21407, 19266, 16384, 12873, 8867, 4520,
12873, 17855, 16819, 15137, 12873, 10114, 6967, 3552,
8867, 12299, 11585, 10426, 8867, 6967, 4799, 2446,
4520, 6270, 5906, 5315, 4520, 3552, 2446, 1247};
void iqtab_init(int* iqtab, unsigned char* iq_y)
{
int i;
for (i = 0; i < DCTSIZE2; i++)
{
iqtab[i] = iq_y[i] * aanscales[zscan[i]] >> (CONST_BITS14 - IFAST_SCALE_BITS);
}
}
unsigned short* rl2blk(int* blk, unsigned short* mdec_rl)
{
int i, k, q_scale, rl;
int* iqtab;
memset(blk, 0, 6 * DCTSIZE2 * 4);
iqtab = iq_uv;
for (i = 0; i < 6; i++)
{ // decode blocks (Cr,Cb,Y1,Y2,Y3,Y4)
if (i > 1)
iqtab = iq_y;
// zigzag transformation
rl = *mdec_rl++;
q_scale = RUNOF(rl);
blk[0] = iqtab[0] * VALOF(rl);
for (k = 0;;)
{
rl = *mdec_rl++;
if (rl == NOP)
break;
k += RUNOF(rl) + 1; // skip level zero-coefficients
if (k > 63)
break;
blk[zscan[k]] = (VALOF(rl) * iqtab[k] * q_scale) / 8; // / 16;
}
idct(blk, k + 1);
blk += DCTSIZE2;
}
return mdec_rl;
}
unsigned char roundtbl[256 * 3];
void round_init(void)
{
int i;
for (i = 0; i < 256; i++)
{
roundtbl[i] = 0;
roundtbl[i + 256] = i;
roundtbl[i + 512] = 255;
}
}
void yuv2rgb15(int* blk, unsigned short* image)
{
int* Yblk = blk + DCTSIZE2 * 2;
int Cb, Cr, R, G, B;
int* Cbblk = blk;
int* Crblk = blk + DCTSIZE2;
if (!(Config.Mdec & 0x1))
for (int y = 0; y < 16; y += 2, Crblk += 4, Cbblk += 4, Yblk += 8, image += 24)
{
if (y == 8)
Yblk += DCTSIZE2;
for (int x = 0; x < 4; x++, image += 2, Crblk++, Cbblk++, Yblk += 2)
{
Cr = *Crblk;
Cb = *Cbblk;
R = MULR(Cr);
G = MULG(Cb) + MULG2(Cr);
B = MULB(Cb);
RGB15(0, Yblk[0]);
RGB15(1, Yblk[1]);
RGB15(16, Yblk[8]);
RGB15(17, Yblk[9]);
Cr = *(Crblk + 4);
Cb = *(Cbblk + 4);
R = MULR(Cr);
G = MULG(Cb) + MULG2(Cr);
B = MULB(Cb);
RGB15(8, Yblk[DCTSIZE2 + 0]);
RGB15(9, Yblk[DCTSIZE2 + 1]);
RGB15(24, Yblk[DCTSIZE2 + 8]);
RGB15(25, Yblk[DCTSIZE2 + 9]);
}
}
else
for (int y = 0; y < 16; y += 2, Yblk += 8, image += 24)
{
if (y == 8)
Yblk += DCTSIZE2;
for (int x = 0; x < 4; x++, image += 2, Yblk += 2)
{
RGB15BW(0, Yblk[0]);
RGB15BW(1, Yblk[1]);
RGB15BW(16, Yblk[8]);
RGB15BW(17, Yblk[9]);
RGB15BW(8, Yblk[DCTSIZE2 + 0]);
RGB15BW(9, Yblk[DCTSIZE2 + 1]);
RGB15BW(24, Yblk[DCTSIZE2 + 8]);
RGB15BW(25, Yblk[DCTSIZE2 + 9]);
}
}
}
void yuv2rgb24(int* blk, unsigned char* image)
{
int* Yblk = blk + DCTSIZE2 * 2;
int Cb, Cr, R, G, B;
int* Cbblk = blk;
int* Crblk = blk + DCTSIZE2;
if (!(Config.Mdec & 0x1))
for (int y = 0; y < 16; y += 2, Crblk += 4, Cbblk += 4, Yblk += 8, image += 24 * 3)
{
if (y == 8)
Yblk += DCTSIZE2;
for (int x = 0; x < 4; x++, image += 6, Crblk++, Cbblk++, Yblk += 2)
{
Cr = *Crblk;
Cb = *Cbblk;
R = MULR(Cr);
G = MULG(Cb) + MULG2(Cr);
B = MULB(Cb);
RGB24(0, Yblk[0]);
RGB24(1 * 3, Yblk[1]);
RGB24(16 * 3, Yblk[8]);
RGB24(17 * 3, Yblk[9]);
Cr = *(Crblk + 4);
Cb = *(Cbblk + 4);
R = MULR(Cr);
G = MULG(Cb) + MULG2(Cr);
B = MULB(Cb);
RGB24(8 * 3, Yblk[DCTSIZE2 + 0]);
RGB24(9 * 3, Yblk[DCTSIZE2 + 1]);
RGB24(24 * 3, Yblk[DCTSIZE2 + 8]);
RGB24(25 * 3, Yblk[DCTSIZE2 + 9]);
}
}
else
for (int y = 0; y < 16; y += 2, Yblk += 8, image += 24 * 3)
{
if (y == 8)
Yblk += DCTSIZE2;
for (int x = 0; x < 4; x++, image += 6, Yblk += 2)
{
RGB24BW(0, Yblk[0]);
RGB24BW(1 * 3, Yblk[1]);
RGB24BW(16 * 3, Yblk[8]);
RGB24BW(17 * 3, Yblk[9]);
RGB24BW(8 * 3, Yblk[DCTSIZE2 + 0]);
RGB24BW(9 * 3, Yblk[DCTSIZE2 + 1]);
RGB24BW(24 * 3, Yblk[DCTSIZE2 + 8]);
RGB24BW(25 * 3, Yblk[DCTSIZE2 + 9]);
}
}
}
//todo: psxmode: add mdec savestate support
//int SaveState::mdecFreeze() {
// Freeze(mdec);
// Freeze(iq_y);
// Freeze(iq_uv);
//
// return 0;
//
//}