mirror of https://github.com/PCSX2/pcsx2.git
469 lines
11 KiB
C++
469 lines
11 KiB
C++
/* Pcsx2 - Pc Ps2 Emulator
|
|
* Copyright (C) 2002-2008 Pcsx2 Team
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
|
|
*/
|
|
|
|
/* This code was based on the FPSE v0.08 Mdec decoder*/
|
|
|
|
#include "PrecompiledHeader.h"
|
|
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include "Common.h"
|
|
|
|
#include "Mdec.h"
|
|
#include "IopHw.h"
|
|
|
|
struct {
|
|
u32 command;
|
|
u32 status;
|
|
u16 *rl;
|
|
int rlsize;
|
|
} mdec;
|
|
|
|
struct config_mdec {
|
|
u32 Mdec;
|
|
};
|
|
struct config_mdec Config;
|
|
|
|
u32 mdecArr2[0x100000] = { 0 };
|
|
|
|
u32 mdecMem[0x100000]; //watherver large size. //Memory only used to get DMA data and not really for anything else.
|
|
//Sould be optimized(the funcs. that use it) to read IOP RAM direcly.
|
|
#define PSXM(x) ((uptr)mdecMem + x)
|
|
|
|
|
|
int iq_y[DCTSIZE2],iq_uv[DCTSIZE2];
|
|
|
|
static void idct1(int *block)
|
|
{
|
|
int i, val;
|
|
|
|
val = RANGE(DESCALE(block[0], PASS1_BITS+3));
|
|
|
|
for(i=0;i<DCTSIZE2;i++)
|
|
block[i]=val;
|
|
}
|
|
|
|
void idct(int *block,int k)
|
|
{
|
|
int tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
|
|
int z5, z10, z11, z12, z13;
|
|
int *ptr;
|
|
int i;
|
|
|
|
if (!k) { idct1(block); return; }
|
|
|
|
ptr = block;
|
|
for (i = 0; i< DCTSIZE; i++,ptr++) {
|
|
|
|
if ((ptr[DCTSIZE*1] | ptr[DCTSIZE*2] | ptr[DCTSIZE*3] |
|
|
ptr[DCTSIZE*4] | ptr[DCTSIZE*5] | ptr[DCTSIZE*6] |
|
|
ptr[DCTSIZE*7]) == 0) {
|
|
ptr[DCTSIZE*0] =
|
|
ptr[DCTSIZE*1] =
|
|
ptr[DCTSIZE*2] =
|
|
ptr[DCTSIZE*3] =
|
|
ptr[DCTSIZE*4] =
|
|
ptr[DCTSIZE*5] =
|
|
ptr[DCTSIZE*6] =
|
|
ptr[DCTSIZE*7] =
|
|
ptr[DCTSIZE*0];
|
|
|
|
continue;
|
|
}
|
|
|
|
z10 = ptr[DCTSIZE*0] + ptr[DCTSIZE*4];
|
|
z11 = ptr[DCTSIZE*0] - ptr[DCTSIZE*4];
|
|
z13 = ptr[DCTSIZE*2] + ptr[DCTSIZE*6];
|
|
z12 = MULTIPLY(ptr[DCTSIZE*2] - ptr[DCTSIZE*6], FIX_1_414213562) - z13;
|
|
|
|
tmp0 = z10 + z13;
|
|
tmp3 = z10 - z13;
|
|
tmp1 = z11 + z12;
|
|
tmp2 = z11 - z12;
|
|
|
|
z13 = ptr[DCTSIZE*3] + ptr[DCTSIZE*5];
|
|
z10 = ptr[DCTSIZE*3] - ptr[DCTSIZE*5];
|
|
z11 = ptr[DCTSIZE*1] + ptr[DCTSIZE*7];
|
|
z12 = ptr[DCTSIZE*1] - ptr[DCTSIZE*7];
|
|
|
|
z5 = MULTIPLY(z12 - z10, FIX_1_847759065);
|
|
tmp7 = z11 + z13;
|
|
tmp6 = MULTIPLY(z10, FIX_2_613125930) + z5 - tmp7;
|
|
tmp5 = MULTIPLY(z11 - z13, FIX_1_414213562) - tmp6;
|
|
tmp4 = MULTIPLY(z12, FIX_1_082392200) - z5 + tmp5;
|
|
|
|
ptr[DCTSIZE*0] = (tmp0 + tmp7);
|
|
ptr[DCTSIZE*7] = (tmp0 - tmp7);
|
|
ptr[DCTSIZE*1] = (tmp1 + tmp6);
|
|
ptr[DCTSIZE*6] = (tmp1 - tmp6);
|
|
ptr[DCTSIZE*2] = (tmp2 + tmp5);
|
|
ptr[DCTSIZE*5] = (tmp2 - tmp5);
|
|
ptr[DCTSIZE*4] = (tmp3 + tmp4);
|
|
ptr[DCTSIZE*3] = (tmp3 - tmp4);
|
|
|
|
}
|
|
|
|
ptr = block;
|
|
for (i = 0; i < DCTSIZE; i++ ,ptr+=DCTSIZE) {
|
|
|
|
if ((ptr[1] | ptr[2] | ptr[3] | ptr[4] | ptr[5] | ptr[6] |
|
|
ptr[7]) == 0) {
|
|
ptr[0] =
|
|
ptr[1] =
|
|
ptr[2] =
|
|
ptr[3] =
|
|
ptr[4] =
|
|
ptr[5] =
|
|
ptr[6] =
|
|
ptr[7] =
|
|
RANGE(DESCALE(ptr[0], PASS1_BITS+3));;
|
|
|
|
continue;
|
|
}
|
|
|
|
z10 = ptr[0] + ptr[4];
|
|
z11 = ptr[0] - ptr[4];
|
|
z13 = ptr[2] + ptr[6];
|
|
z12 = MULTIPLY(ptr[2] - ptr[6], FIX_1_414213562) - z13;
|
|
|
|
tmp0 = z10 + z13;
|
|
tmp3 = z10 - z13;
|
|
tmp1 = z11 + z12;
|
|
tmp2 = z11 - z12;
|
|
|
|
z13 = ptr[3] + ptr[5];
|
|
z10 = ptr[3] - ptr[5];
|
|
z11 = ptr[1] + ptr[7];
|
|
z12 = ptr[1] - ptr[7];
|
|
|
|
z5 = MULTIPLY(z12 - z10, FIX_1_847759065);
|
|
tmp7 = z11 + z13;
|
|
tmp6 = MULTIPLY(z10, FIX_2_613125930) + z5 - tmp7;
|
|
tmp5 = MULTIPLY(z11 - z13, FIX_1_414213562) - tmp6;
|
|
tmp4 = MULTIPLY(z12, FIX_1_082392200) - z5 + tmp5;
|
|
|
|
ptr[0] = RANGE(DESCALE(tmp0 + tmp7, PASS1_BITS+3));;
|
|
ptr[7] = RANGE(DESCALE(tmp0 - tmp7, PASS1_BITS+3));;
|
|
ptr[1] = RANGE(DESCALE(tmp1 + tmp6, PASS1_BITS+3));;
|
|
ptr[6] = RANGE(DESCALE(tmp1 - tmp6, PASS1_BITS+3));;
|
|
ptr[2] = RANGE(DESCALE(tmp2 + tmp5, PASS1_BITS+3));;
|
|
ptr[5] = RANGE(DESCALE(tmp2 - tmp5, PASS1_BITS+3));;
|
|
ptr[4] = RANGE(DESCALE(tmp3 + tmp4, PASS1_BITS+3));;
|
|
ptr[3] = RANGE(DESCALE(tmp3 - tmp4, PASS1_BITS+3));;
|
|
|
|
}
|
|
}
|
|
|
|
void mdecInit(void) {
|
|
|
|
Config.Mdec = 0; //XXXXXXXXXXXXXXXXX 0 or 1 // 1 is black and white decoding
|
|
|
|
mdec.rl = (u16*)PSXM(0);
|
|
//mdec.rl = (u16*)&psxM[0x100000];
|
|
mdec.command = 0;
|
|
mdec.status = 0;
|
|
round_init();
|
|
}
|
|
|
|
|
|
void mdecWrite0(u32 data) {
|
|
MDEC_LOG("mdec0 write %lx", data);
|
|
|
|
mdec.command = data;
|
|
if ((data&0xf5ff0000)==0x30000000) {
|
|
mdec.rlsize = data&0xffff;
|
|
}
|
|
}
|
|
|
|
void mdecWrite1(u32 data) {
|
|
MDEC_LOG("mdec1 write %lx", data);
|
|
|
|
if (data&0x80000000) { // mdec reset
|
|
round_init();
|
|
// mdecInit();
|
|
}
|
|
}
|
|
|
|
u32 mdecRead0(void) {
|
|
MDEC_LOG("mdec0 read %lx", mdec.command);
|
|
|
|
return mdec.command;
|
|
}
|
|
|
|
u32 mdecRead1(void) {
|
|
MDEC_LOG("mdec1 read %lx", mdec.status);
|
|
|
|
return mdec.status;
|
|
}
|
|
|
|
void psxDma0(u32 adr, u32 bcr, u32 chcr) {
|
|
int cmd = mdec.command;
|
|
|
|
MDEC_LOG("DMA0 %lx %lx %lx", adr, bcr, chcr);
|
|
|
|
if (chcr != 0x01000201) return;
|
|
|
|
// bcr LSBs are the blocksize in words
|
|
// bcr MSBs are the number of block
|
|
int size = (bcr >> 16)*(bcr & 0xffff);
|
|
if (size < 0) {
|
|
// Need to investigate what happen if the transfer is huge
|
|
Console.Error("psxDma0 DMA transfer overflow !");
|
|
return;
|
|
}
|
|
|
|
for (int i = 0; i<(size); i++) {
|
|
*(u32*)PSXM(((i + 0) * 4)) = iopMemRead32(adr + ((i + 0) * 4));
|
|
if (i <20)
|
|
MDEC_LOG(" data %08X %08X ", iopMemRead32((adr & 0x00FFFFFF) + (i * 4)), *(u32*)PSXM((i * 4)));
|
|
}
|
|
|
|
|
|
if (cmd == 0x40000001) {
|
|
u8 *p = (u8*)PSXM(0); //u8 *p = (u8*)PSXM(adr);
|
|
iqtab_init(iq_y, p);
|
|
iqtab_init(iq_uv, p + 64);
|
|
}
|
|
else if ((cmd & 0xf5ff0000) == 0x30000000) {
|
|
mdec.rl = (u16*)PSXM(0); //mdec.rl = (u16*)PSXM(adr);
|
|
}
|
|
|
|
HW_DMA0_CHCR &= ~0x01000000;
|
|
psxDmaInterrupt(0);
|
|
}
|
|
|
|
void psxDma1(u32 adr, u32 bcr, u32 chcr) {
|
|
int blk[DCTSIZE2*6];
|
|
unsigned short *image;
|
|
|
|
MDEC_LOG("DMA1 %lx %lx %lx (cmd = %lx)", adr, bcr, chcr, mdec.command);
|
|
|
|
if (chcr != 0x01000200) return;
|
|
// bcr LSBs are the blocksize in words
|
|
// bcr MSBs are the number of block
|
|
int size = (bcr >> 16)*(bcr & 0xffff);
|
|
int size2 = (bcr >> 16)*(bcr & 0xffff);
|
|
if (size < 0) {
|
|
// Need to investigate what happen if the transfer is huge
|
|
Console.Error("psxDma1 DMA transfer overflow !");
|
|
return;
|
|
}
|
|
|
|
image = (u16*)mdecArr2;//(u16*)PSXM(0); //image = (u16*)PSXM(adr);
|
|
|
|
if (mdec.command&0x08000000) {
|
|
for (;size>0;size-=(16*16)/2,image+=(16*16)) {
|
|
mdec.rl = rl2blk(blk,mdec.rl);
|
|
yuv2rgb15(blk,image);
|
|
}
|
|
} else {
|
|
for (;size>0;size-=(24*16)/2,image+=(24*16)) {
|
|
mdec.rl = rl2blk(blk,mdec.rl);
|
|
yuv2rgb24(blk,(u8 *)image);
|
|
}
|
|
}
|
|
|
|
for (int i = 0; i<(size2); i++) {
|
|
iopMemWrite32(((adr & 0x00FFFFFF) + (i * 4) + 0), mdecArr2[i]);
|
|
if (i <20)
|
|
MDEC_LOG(" data %08X %08X ", iopMemRead32((adr & 0x00FFFFFF) + (i * 4)), mdecArr2[i]);
|
|
}
|
|
|
|
HW_DMA1_CHCR &= ~0x01000000;
|
|
psxDmaInterrupt(1);
|
|
}
|
|
|
|
static int zscan[DCTSIZE2] = {
|
|
0 ,1 ,8 ,16,9 ,2 ,3 ,10,
|
|
17,24,32,25,18,11,4 ,5 ,
|
|
12,19,26,33,40,48,41,34,
|
|
27,20,13,6 ,7 ,14,21,28,
|
|
35,42,49,56,57,50,43,36,
|
|
29,22,15,23,30,37,44,51,
|
|
58,59,52,45,38,31,39,46,
|
|
53,60,61,54,47,55,62,63
|
|
};
|
|
|
|
static int aanscales[DCTSIZE2] = {
|
|
16384, 22725, 21407, 19266, 16384, 12873, 8867, 4520,
|
|
22725, 31521, 29692, 26722, 22725, 17855, 12299, 6270,
|
|
21407, 29692, 27969, 25172, 21407, 16819, 11585, 5906,
|
|
19266, 26722, 25172, 22654, 19266, 15137, 10426, 5315,
|
|
16384, 22725, 21407, 19266, 16384, 12873, 8867, 4520,
|
|
12873, 17855, 16819, 15137, 12873, 10114, 6967, 3552,
|
|
8867, 12299, 11585, 10426, 8867, 6967, 4799, 2446,
|
|
4520, 6270, 5906, 5315, 4520, 3552, 2446, 1247
|
|
};
|
|
|
|
void iqtab_init(int *iqtab,unsigned char *iq_y)
|
|
{
|
|
int i;
|
|
|
|
for(i=0;i<DCTSIZE2;i++) {
|
|
iqtab[i] =iq_y[i] *aanscales[zscan[i]]>>(CONST_BITS14-IFAST_SCALE_BITS);
|
|
}
|
|
}
|
|
|
|
unsigned short* rl2blk(int *blk,unsigned short *mdec_rl) {
|
|
int i,k,q_scale,rl;
|
|
int *iqtab;
|
|
|
|
memset (blk, 0, 6*DCTSIZE2*4);
|
|
iqtab = iq_uv;
|
|
for(i=0;i<6;i++) { // decode blocks (Cr,Cb,Y1,Y2,Y3,Y4)
|
|
if (i>1) iqtab = iq_y;
|
|
|
|
// zigzag transformation
|
|
rl = *mdec_rl++;
|
|
q_scale = RUNOF(rl);
|
|
blk[0] = iqtab[0]*VALOF(rl);
|
|
for(k = 0;;) {
|
|
rl = *mdec_rl++;
|
|
if (rl==NOP) break;
|
|
k += RUNOF(rl)+1; // skip level zero-coefficients
|
|
if (k > 63) break;
|
|
blk[zscan[k]] = (VALOF(rl) * iqtab[k] * q_scale) / 8; // / 16;
|
|
}
|
|
|
|
idct(blk,k+1);
|
|
blk+=DCTSIZE2;
|
|
}
|
|
return mdec_rl;
|
|
}
|
|
|
|
unsigned char roundtbl[256*3];
|
|
|
|
void round_init(void) {
|
|
int i;
|
|
for(i=0;i<256;i++) {
|
|
roundtbl[i]=0;
|
|
roundtbl[i+256]=i;
|
|
roundtbl[i+512]=255;
|
|
}
|
|
}
|
|
|
|
void yuv2rgb15(int *blk,unsigned short *image) {
|
|
int x,y;
|
|
int *Yblk = blk+DCTSIZE2*2;
|
|
int Cb,Cr,R,G,B;
|
|
int *Cbblk = blk;
|
|
int *Crblk = blk+DCTSIZE2;
|
|
|
|
if (!(Config.Mdec&0x1))
|
|
for (y=0;y<16;y+=2,Crblk+=4,Cbblk+=4,Yblk+=8,image+=24) {
|
|
if (y==8) Yblk+=DCTSIZE2;
|
|
for (x=0;x<4;x++,image+=2,Crblk++,Cbblk++,Yblk+=2) {
|
|
Cr = *Crblk;
|
|
Cb = *Cbblk;
|
|
R = MULR(Cr);
|
|
G = MULG(Cb) + MULG2(Cr);
|
|
B = MULB(Cb);
|
|
|
|
RGB15(0, Yblk[0]);
|
|
RGB15(1, Yblk[1]);
|
|
RGB15(16, Yblk[8]);
|
|
RGB15(17, Yblk[9]);
|
|
|
|
Cr = *(Crblk+4);
|
|
Cb = *(Cbblk+4);
|
|
R = MULR(Cr);
|
|
G = MULG(Cb) + MULG2(Cr);
|
|
B = MULB(Cb);
|
|
|
|
RGB15(8, Yblk[DCTSIZE2+0]);
|
|
RGB15(9, Yblk[DCTSIZE2+1]);
|
|
RGB15(24, Yblk[DCTSIZE2+8]);
|
|
RGB15(25, Yblk[DCTSIZE2+9]);
|
|
}
|
|
} else
|
|
for (y=0;y<16;y+=2,Yblk+=8,image+=24) {
|
|
if (y==8) Yblk+=DCTSIZE2;
|
|
for (x=0;x<4;x++,image+=2,Yblk+=2) {
|
|
RGB15BW(0, Yblk[0]);
|
|
RGB15BW(1, Yblk[1]);
|
|
RGB15BW(16, Yblk[8]);
|
|
RGB15BW(17, Yblk[9]);
|
|
|
|
RGB15BW(8, Yblk[DCTSIZE2+0]);
|
|
RGB15BW(9, Yblk[DCTSIZE2+1]);
|
|
RGB15BW(24, Yblk[DCTSIZE2+8]);
|
|
RGB15BW(25, Yblk[DCTSIZE2+9]);
|
|
}
|
|
}
|
|
}
|
|
|
|
void yuv2rgb24(int *blk,unsigned char *image) {
|
|
int x,y;
|
|
int *Yblk = blk+DCTSIZE2*2;
|
|
int Cb,Cr,R,G,B;
|
|
int *Cbblk = blk;
|
|
int *Crblk = blk+DCTSIZE2;
|
|
|
|
if (!(Config.Mdec&0x1))
|
|
for (y=0;y<16;y+=2,Crblk+=4,Cbblk+=4,Yblk+=8,image+=24*3) {
|
|
if (y==8) Yblk+=DCTSIZE2;
|
|
for (x=0;x<4;x++,image+=6,Crblk++,Cbblk++,Yblk+=2) {
|
|
Cr = *Crblk;
|
|
Cb = *Cbblk;
|
|
R = MULR(Cr);
|
|
G = MULG(Cb) + MULG2(Cr);
|
|
B = MULB(Cb);
|
|
|
|
RGB24(0, Yblk[0]);
|
|
RGB24(1*3, Yblk[1]);
|
|
RGB24(16*3, Yblk[8]);
|
|
RGB24(17*3, Yblk[9]);
|
|
|
|
Cr = *(Crblk+4);
|
|
Cb = *(Cbblk+4);
|
|
R = MULR(Cr);
|
|
G = MULG(Cb) + MULG2(Cr);
|
|
B = MULB(Cb);
|
|
|
|
RGB24(8*3, Yblk[DCTSIZE2+0]);
|
|
RGB24(9*3, Yblk[DCTSIZE2+1]);
|
|
RGB24(24*3, Yblk[DCTSIZE2+8]);
|
|
RGB24(25*3, Yblk[DCTSIZE2+9]);
|
|
}
|
|
} else
|
|
for (y=0;y<16;y+=2,Yblk+=8,image+=24*3) {
|
|
if (y==8) Yblk+=DCTSIZE2;
|
|
for (x=0;x<4;x++,image+=6,Yblk+=2) {
|
|
RGB24BW(0, Yblk[0]);
|
|
RGB24BW(1*3, Yblk[1]);
|
|
RGB24BW(16*3, Yblk[8]);
|
|
RGB24BW(17*3, Yblk[9]);
|
|
|
|
RGB24BW(8*3, Yblk[DCTSIZE2+0]);
|
|
RGB24BW(9*3, Yblk[DCTSIZE2+1]);
|
|
RGB24BW(24*3, Yblk[DCTSIZE2+8]);
|
|
RGB24BW(25*3, Yblk[DCTSIZE2+9]);
|
|
}
|
|
}
|
|
}
|
|
|
|
//todo: psxmode: add mdec savestate support
|
|
//int SaveState::mdecFreeze() {
|
|
// Freeze(mdec);
|
|
// Freeze(iq_y);
|
|
// Freeze(iq_uv);
|
|
//
|
|
// return 0;
|
|
//
|
|
//}
|