// Listing metadata: C++ source, 454 lines, 12 KiB.
#pragma once
|
|
#include "oslib/oslib.h"
|
|
|
|
extern u8* vq_codebook;
|
|
extern u32 palette_index;
|
|
extern u32 palette_ram[1024];
|
|
extern bool pal_needs_update,fog_needs_update,KillTex;
|
|
extern u32 pal_rev_256[4];
|
|
extern u32 pal_rev_16[64];
|
|
extern u32 _pal_rev_256[4];
|
|
extern u32 _pal_rev_16[64];
|
|
|
|
extern u32 detwiddle[2][8][1024];
|
|
|
|
//Pixel buffer class (really helpful ;) )
|
|
struct PixelBuffer
|
|
{
|
|
u16* p_buffer_start;
|
|
u16* p_current_line;
|
|
u16* p_current_pixel;
|
|
|
|
u32 pixels_per_line;
|
|
|
|
void init(void* data,u32 ppl_bytes)
|
|
{
|
|
p_buffer_start=p_current_line=p_current_pixel=(u16*)data;
|
|
pixels_per_line=ppl_bytes/sizeof(u16);
|
|
}
|
|
__forceinline void prel(u32 x,u16 value)
|
|
{
|
|
p_current_pixel[x]=value;
|
|
}
|
|
|
|
__forceinline void prel(u32 x,u32 y,u16 value)
|
|
{
|
|
p_current_pixel[y*pixels_per_line+x]=value;
|
|
}
|
|
|
|
__forceinline void rmovex(u32 value)
|
|
{
|
|
p_current_pixel+=value;
|
|
}
|
|
__forceinline void rmovey(u32 value)
|
|
{
|
|
p_current_line+=pixels_per_line*value;
|
|
p_current_pixel=p_current_line;
|
|
}
|
|
__forceinline void amove(u32 x_m,u32 y_m)
|
|
{
|
|
//p_current_pixel=p_buffer_start;
|
|
p_current_line=p_buffer_start+pixels_per_line*y_m;
|
|
p_current_pixel=p_current_line + x_m;
|
|
}
|
|
};
|
|
|
|
// Declared here, defined elsewhere; takes no arguments and returns nothing.
// NOTE(review): presumably refreshes palette state (see pal_needs_update) -- confirm against the definition.
void palette_update();
|
|
|
|
// Limits x to the range [minv,maxv] as min(maxv,max(minv,x)).
// min/max are not defined in this header; they must be in scope at the point of use.
// NOTE(review): if min/max are macros, arguments may be evaluated more than once -- avoid side effects.
#define clamp(minv,maxv,x) min(maxv,max(minv,x))
|
|
|
|
// 16-bit output repackers. Each macro rearranges the bit fields of `word`
// into a 16-bit result; the field positions are spelled out per macro.
// `word` is parenthesized at every use so that expression arguments
// (e.g. ARGB1555(a|b)) are shifted as a whole.

// 1:5:5:5 (A at bit 15, then R,G,B) -> 5:5:5:1 (R at bit 11, G at 6, B at 1, A at bit 0).
#define ARGB1555( word )	( (((word)>>15)&1) | ((((word)>>10) & 0x1F)<<11)  | ((((word)>>5) & 0x1F)<<6)  | ((((word)>>0) & 0x1F)<<1) )
// Earlier expansion, kept for reference:
// ARGB8888(unpack_1_to_8[(word>>15)&1],unpack_5_to_8[(word>>10) & 0x1F],
//unpack_5_to_8[(word>>5) & 0x1F],unpack_5_to_8[word&0x1F])

// 5:6:5 -> 5:6:5; every field is written back to the position it came from.
#define ARGB565( word )		( ((((word)>>0)&0x1F)<<0) | ((((word)>>5)&0x3F)<<5) | ((((word)>>11)&0x1F)<<11) )

// Earlier expansions, kept for reference:
//ARGB8888(0xFF,unpack_5_to_8[(word>>11) & 0x1F],	unpack_6_to_8[(word>>5) & 0x3F],unpack_5_to_8[word&0x1F])
//( 0xFF000000 | unpack_5_to_8[(word>>11) & 0x1F] | unpack_5_to_8[(word>>5) & 0x3F]<<8 | unpack_5_to_8[word&0x1F]<<16 )

// 4:4:4:4 with A in the top nibble -> 4:4:4:4 with A in the bottom nibble
// (bits 0-3 -> 4-7, bits 4-7 -> 8-11, bits 8-11 -> 12-15, bits 12-15 -> 0-3).
#define ARGB4444( word )	( ((((word)>>0)&0xF)<<4) | ((((word)>>4)&0xF)<<8) | ((((word)>>8)&0xF)<<12) | ((((word)>>12)&0xF)<<0) )
// Earlier expansion, kept for reference:
//ARGB8888( (word&0xF000)>>(12-4),(word&0xF00)>>(8-4),(word&0xF0)>>(4-4),(word&0xF)<<4 )

// 8:8:8:8 -> 4:4:4:4: keeps the high nibble of each byte; the top byte's
// nibble lands in bits 0-3. `word` must be at least 32 bits wide for the
// >>20 and >>28 fields to be non-zero.
#define ARGB8888( word )	( ((((word)>>4)&0xF)<<4) | ((((word)>>12)&0xF)<<8) | ((((word)>>20)&0xF)<<12) | ((((word)>>28)&0xF)<<0) )
|
|
|
|
template<class PixelPacker>
|
|
__forceinline u32 YUV422(s32 Y,s32 Yu,s32 Yv)
|
|
{
|
|
Yu-=128;
|
|
Yv-=128;
|
|
|
|
//s32 B = (76283*(Y - 16) + 132252*(Yu - 128))>>16;
|
|
//s32 G = (76283*(Y - 16) - 53281 *(Yv - 128) - 25624*(Yu - 128))>>16;
|
|
//s32 R = (76283*(Y - 16) + 104595*(Yv - 128))>>16;
|
|
|
|
s32 R = Y + Yv*11/8; // Y + (Yv-128) * (11/8) ?
|
|
s32 G = Y - (Yu*11 + Yv*22)/32; // Y - (Yu-128) * (11/8) * 0.25 - (Yv-128) * (11/8) * 0.5 ?
|
|
s32 B = Y + Yu*110/64; // Y + (Yu-128) * (11/8) * 1.25 ?
|
|
|
|
return PixelPacker::packRGB(clamp(0,255,R),clamp(0,255,G),clamp(0,255,B));
|
|
}
|
|
|
|
// Sums two detwiddle table entries: table 0 is selected by bcy and indexed by x,
// table 1 is selected by bcx and indexed by y. The texture_TW/texture_VQ loops
// divide the result by the converter's pixels-per-block to pick an input block.
#define twop(x,y,bcx,bcy) (detwiddle[0][bcy][x]+detwiddle[1][bcx][y])
|
|
|
|
//pixel packers !
|
|
struct pp_565
|
|
{
|
|
__forceinline static u32 packRGB(u8 R,u8 G,u8 B)
|
|
{
|
|
R>>=3;
|
|
G>>=2;
|
|
B>>=3;
|
|
return (R<<11) | (G<<5) | (B<<0);
|
|
}
|
|
};
|
|
|
|
//pixel convertors !
|
|
// Converter scaffolding.
// pixelcvt_start(cvt_name,blk_w,blk_h) opens
//     template<class PixelPacker> struct cvt_name
// with constants xpp=blk_w and ypp=blk_h, and opens the body of
//     static void Convert(PixelBuffer* pb,u8* data)
// The caller supplies the body as a brace block right after the macro.
// pixelcvt_end closes Convert and the struct (the caller adds the ';').
// pixelcvt_next closes the current converter and opens the next one.
#define pixelcvt_start(cvt_name,blk_w,blk_h) \
	template<class PixelPacker> \
	struct cvt_name \
	{ \
		static const u32 xpp=blk_w; \
		static const u32 ypp=blk_h; \
		__forceinline static void Convert(PixelBuffer* pb,u8* data) \
		{

#define pixelcvt_end } }
#define pixelcvt_next(cvt_name,blk_w,blk_h) pixelcvt_end; pixelcvt_start(cvt_name,blk_w,blk_h)
|
|
//Non twiddled
|
|
pixelcvt_start(conv565_PL,4,1)
|
|
{
|
|
//convert 4x1
|
|
u16* p_in=(u16*)data;
|
|
//0,0
|
|
pb->prel(0,ARGB565(p_in[0]));
|
|
//1,0
|
|
pb->prel(1,ARGB565(p_in[1]));
|
|
//2,0
|
|
pb->prel(2,ARGB565(p_in[2]));
|
|
//3,0
|
|
pb->prel(3,ARGB565(p_in[3]));
|
|
}
|
|
pixelcvt_next(conv1555_PL,4,1)
|
|
{
|
|
//convert 4x1
|
|
u16* p_in=(u16*)data;
|
|
//0,0
|
|
pb->prel(0,ARGB1555(p_in[0]));
|
|
//1,0
|
|
pb->prel(1,ARGB1555(p_in[1]));
|
|
//2,0
|
|
pb->prel(2,ARGB1555(p_in[2]));
|
|
//3,0
|
|
pb->prel(3,ARGB1555(p_in[3]));
|
|
}
|
|
pixelcvt_next(conv4444_PL,4,1)
|
|
{
|
|
//convert 4x1
|
|
u16* p_in=(u16*)data;
|
|
//0,0
|
|
pb->prel(0,ARGB4444(p_in[0]));
|
|
//1,0
|
|
pb->prel(1,ARGB4444(p_in[1]));
|
|
//2,0
|
|
pb->prel(2,ARGB4444(p_in[2]));
|
|
//3,0
|
|
pb->prel(3,ARGB4444(p_in[3]));
|
|
}
|
|
pixelcvt_next(convYUV_PL,4,1)
|
|
{
|
|
//convert 4x1 4444 to 4x1 8888
|
|
u32* p_in=(u32*)data;
|
|
|
|
|
|
s32 Y0 = (p_in[0]>>8) &255; //
|
|
s32 Yu = (p_in[0]>>0) &255; //p_in[0]
|
|
s32 Y1 = (p_in[0]>>24) &255; //p_in[3]
|
|
s32 Yv = (p_in[0]>>16) &255; //p_in[2]
|
|
|
|
//0,0
|
|
pb->prel(0,YUV422<PixelPacker>(Y0,Yu,Yv));
|
|
//1,0
|
|
pb->prel(1,YUV422<PixelPacker>(Y1,Yu,Yv));
|
|
|
|
//next 4 bytes
|
|
p_in+=1;
|
|
|
|
Y0 = (p_in[0]>>8) &255; //
|
|
Yu = (p_in[0]>>0) &255; //p_in[0]
|
|
Y1 = (p_in[0]>>24) &255; //p_in[3]
|
|
Yv = (p_in[0]>>16) &255; //p_in[2]
|
|
|
|
//0,0
|
|
pb->prel(2,YUV422<PixelPacker>(Y0,Yu,Yv));
|
|
//1,0
|
|
pb->prel(3,YUV422<PixelPacker>(Y1,Yu,Yv));
|
|
}
|
|
pixelcvt_next(convBMP_PL,4,1)
|
|
{
|
|
u16* p_in=(u16*)data;
|
|
pb->prel(0,ARGB8888(p_in[0]));
|
|
pb->prel(1,ARGB8888(p_in[1]));
|
|
pb->prel(2,ARGB8888(p_in[2]));
|
|
pb->prel(3,ARGB8888(p_in[3]));
|
|
}
|
|
pixelcvt_end;
|
|
//twiddled
|
|
pixelcvt_start(conv565_TW,2,2)
|
|
{
|
|
//convert 4x1 565 to 4x1 8888
|
|
u16* p_in=(u16*)data;
|
|
//0,0
|
|
pb->prel(0,0,ARGB565(p_in[0]));
|
|
//0,1
|
|
pb->prel(0,1,ARGB565(p_in[1]));
|
|
//1,0
|
|
pb->prel(1,0,ARGB565(p_in[2]));
|
|
//1,1
|
|
pb->prel(1,1,ARGB565(p_in[3]));
|
|
}
|
|
pixelcvt_next(conv1555_TW,2,2)
|
|
{
|
|
//convert 4x1 565 to 4x1 8888
|
|
u16* p_in=(u16*)data;
|
|
//0,0
|
|
pb->prel(0,0,ARGB1555(p_in[0]));
|
|
//0,1
|
|
pb->prel(0,1,ARGB1555(p_in[1]));
|
|
//1,0
|
|
pb->prel(1,0,ARGB1555(p_in[2]));
|
|
//1,1
|
|
pb->prel(1,1,ARGB1555(p_in[3]));
|
|
}
|
|
pixelcvt_next(conv4444_TW,2,2)
|
|
{
|
|
//convert 4x1 565 to 4x1 8888
|
|
u16* p_in=(u16*)data;
|
|
//0,0
|
|
pb->prel(0,0,ARGB4444(p_in[0]));
|
|
//0,1
|
|
pb->prel(0,1,ARGB4444(p_in[1]));
|
|
//1,0
|
|
pb->prel(1,0,ARGB4444(p_in[2]));
|
|
//1,1
|
|
pb->prel(1,1,ARGB4444(p_in[3]));
|
|
}
|
|
pixelcvt_next(convYUV_TW,2,2)
|
|
{
|
|
//convert 4x1 4444 to 4x1 8888
|
|
u16* p_in=(u16*)data;
|
|
|
|
|
|
s32 Y0 = (p_in[0]>>8) &255; //
|
|
s32 Yu = (p_in[0]>>0) &255; //p_in[0]
|
|
s32 Y1 = (p_in[2]>>8) &255; //p_in[3]
|
|
s32 Yv = (p_in[2]>>0) &255; //p_in[2]
|
|
|
|
//0,0
|
|
pb->prel(0,0,YUV422<PixelPacker>(Y0,Yu,Yv));
|
|
//1,0
|
|
pb->prel(1,0,YUV422<PixelPacker>(Y1,Yu,Yv));
|
|
|
|
//next 4 bytes
|
|
//p_in+=2;
|
|
|
|
Y0 = (p_in[1]>>8) &255; //
|
|
Yu = (p_in[1]>>0) &255; //p_in[0]
|
|
Y1 = (p_in[3]>>8) &255; //p_in[3]
|
|
Yv = (p_in[3]>>0) &255; //p_in[2]
|
|
|
|
//0,1
|
|
pb->prel(0,1,YUV422<PixelPacker>(Y0,Yu,Yv));
|
|
//1,1
|
|
pb->prel(1,1,YUV422<PixelPacker>(Y1,Yu,Yv));
|
|
}
|
|
pixelcvt_next(convBMP_TW,2,2)
|
|
{
|
|
u16* p_in=(u16*)data;
|
|
pb->prel(0,0,ARGB8888(p_in[0]));
|
|
pb->prel(0,1,ARGB8888(p_in[1]));
|
|
pb->prel(1,0,ARGB8888(p_in[2]));
|
|
pb->prel(1,1,ARGB8888(p_in[3]));
|
|
}
|
|
pixelcvt_end;
|
|
|
|
pixelcvt_start(convPAL4_TW,4,4)
|
|
{
|
|
u8* p_in=(u8*)data;
|
|
u32* pal=&palette_ram[palette_index];
|
|
|
|
pb->prel(0,0,pal[p_in[0]&0xF]);
|
|
pb->prel(0,1,pal[(p_in[0]>>4)&0xF]);p_in++;
|
|
pb->prel(1,0,pal[p_in[0]&0xF]);
|
|
pb->prel(1,1,pal[(p_in[0]>>4)&0xF]);p_in++;
|
|
|
|
pb->prel(0,2,pal[p_in[0]&0xF]);
|
|
pb->prel(0,3,pal[(p_in[0]>>4)&0xF]);p_in++;
|
|
pb->prel(1,2,pal[p_in[0]&0xF]);
|
|
pb->prel(1,3,pal[(p_in[0]>>4)&0xF]);p_in++;
|
|
|
|
pb->prel(2,0,pal[p_in[0]&0xF]);
|
|
pb->prel(2,1,pal[(p_in[0]>>4)&0xF]);p_in++;
|
|
pb->prel(3,0,pal[p_in[0]&0xF]);
|
|
pb->prel(3,1,pal[(p_in[0]>>4)&0xF]);p_in++;
|
|
|
|
pb->prel(2,2,pal[p_in[0]&0xF]);
|
|
pb->prel(2,3,pal[(p_in[0]>>4)&0xF]);p_in++;
|
|
pb->prel(3,2,pal[p_in[0]&0xF]);
|
|
pb->prel(3,3,pal[(p_in[0]>>4)&0xF]);p_in++;
|
|
}
|
|
pixelcvt_next(convPAL8_TW,2,4)
|
|
{
|
|
u8* p_in=(u8*)data;
|
|
u32* pal=&palette_ram[palette_index];
|
|
|
|
pb->prel(0,0,pal[p_in[0]]);p_in++;
|
|
pb->prel(0,1,pal[p_in[0]]);p_in++;
|
|
pb->prel(1,0,pal[p_in[0]]);p_in++;
|
|
pb->prel(1,1,pal[p_in[0]]);p_in++;
|
|
|
|
pb->prel(0,2,pal[p_in[0]]);p_in++;
|
|
pb->prel(0,3,pal[p_in[0]]);p_in++;
|
|
pb->prel(1,2,pal[p_in[0]]);p_in++;
|
|
pb->prel(1,3,pal[p_in[0]]);p_in++;
|
|
}
|
|
pixelcvt_end;
|
|
//handler functions
|
|
template<class PixelConvertor>
|
|
void texture_PL(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height)
|
|
{
|
|
pb->amove(0,0);
|
|
|
|
Height/=PixelConvertor::ypp;
|
|
Width/=PixelConvertor::xpp;
|
|
|
|
for (u32 y=0;y<Height;y++)
|
|
{
|
|
for (u32 x=0;x<Width;x++)
|
|
{
|
|
u8* p = p_in;
|
|
PixelConvertor::Convert(pb,p);
|
|
p_in+=8;
|
|
|
|
pb->rmovex(PixelConvertor::xpp);
|
|
}
|
|
pb->rmovey(PixelConvertor::ypp);
|
|
}
|
|
}
|
|
|
|
template<class PixelConvertor>
|
|
void texture_TW(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height)
|
|
{
|
|
pb->amove(0,0);
|
|
|
|
const u32 divider=PixelConvertor::xpp*PixelConvertor::ypp;
|
|
|
|
unsigned long bcx_,bcy_;
|
|
bcx_=bitscanrev(Width);
|
|
bcy_=bitscanrev(Height);
|
|
const u32 bcx=bcx_-3;
|
|
const u32 bcy=bcy_-3;
|
|
|
|
for (u32 y=0;y<Height;y+=PixelConvertor::ypp)
|
|
{
|
|
for (u32 x=0;x<Width;x+=PixelConvertor::xpp)
|
|
{
|
|
u8* p = &p_in[(twop(x,y,bcx,bcy)/divider)<<3];
|
|
PixelConvertor::Convert(pb,p);
|
|
|
|
pb->rmovex(PixelConvertor::xpp);
|
|
}
|
|
pb->rmovey(PixelConvertor::ypp);
|
|
}
|
|
}
|
|
|
|
template<class PixelConvertor>
|
|
void texture_VQ(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height)
|
|
{
|
|
p_in+=256*4*2;
|
|
pb->amove(0,0);
|
|
|
|
const u32 divider=PixelConvertor::xpp*PixelConvertor::ypp;
|
|
unsigned long bcx_,bcy_;
|
|
bcx_=bitscanrev(Width);
|
|
bcy_=bitscanrev(Height);
|
|
const u32 bcx=bcx_-3;
|
|
const u32 bcy=bcy_-3;
|
|
|
|
for (u32 y=0;y<Height;y+=PixelConvertor::ypp)
|
|
{
|
|
for (u32 x=0;x<Width;x+=PixelConvertor::xpp)
|
|
{
|
|
u8 p = p_in[twop(x,y,bcx,bcy)/divider];
|
|
PixelConvertor::Convert(pb,&vq_codebook[p*8]);
|
|
|
|
pb->rmovex(PixelConvertor::xpp);
|
|
}
|
|
pb->rmovey(PixelConvertor::ypp);
|
|
}
|
|
}
|
|
|
|
//We ask the compiler to generate the templates here
|
|
//;)
|
|
//planar formats !
|
|
template void texture_PL<conv565_PL<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_PL<conv1555_PL<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_PL<conv4444_PL<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_PL<convYUV_PL<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_PL<convBMP_PL<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
|
|
//twiddled formats !
|
|
template void texture_TW<conv565_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_TW<conv1555_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_TW<conv4444_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_TW<convYUV_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_TW<convBMP_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
|
|
template void texture_TW<convPAL4_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_TW<convPAL8_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
|
|
//VQ formats !
|
|
template void texture_VQ<conv565_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_VQ<conv1555_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_VQ<conv4444_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_VQ<convYUV_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
template void texture_VQ<convBMP_TW<pp_565> >(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
|
|
//Planar
|
|
// Short names for the decoder instantiations above (all use pp_565).

// non-twiddled
#define tex565_PL		texture_PL<conv565_PL<pp_565> >
#define tex1555_PL		texture_PL<conv1555_PL<pp_565> >
#define tex4444_PL		texture_PL<conv4444_PL<pp_565> >
#define texYUV422_PL	texture_PL<convYUV_PL<pp_565> >
#define texBMP_PL		texture_PL<convBMP_PL<pp_565> >

// twiddled
#define tex565_TW		texture_TW<conv565_TW<pp_565> >
#define tex1555_TW		texture_TW<conv1555_TW<pp_565> >
#define tex4444_TW		texture_TW<conv4444_TW<pp_565> >
#define texYUV422_TW	texture_TW<convYUV_TW<pp_565> >
#define texBMP_TW		texture_TW<convBMP_TW<pp_565> >
#define texPAL4_TW		texture_TW<convPAL4_TW<pp_565> >
#define texPAL8_TW		texture_TW<convPAL8_TW<pp_565> >

// VQ
#define tex565_VQ		texture_VQ<conv565_TW<pp_565> >
#define tex1555_VQ		texture_VQ<conv1555_TW<pp_565> >
#define tex4444_VQ		texture_VQ<conv4444_TW<pp_565> >
#define texYUV422_VQ	texture_VQ<convYUV_TW<pp_565> >
#define texBMP_VQ		texture_VQ<convBMP_TW<pp_565> >
|
|
|
|
void texture_PAL4(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
void texture_PAL8(PixelBuffer* pb,u8* p_in,u32 Width,u32 Height);
|
|
|
|
|
|
// Non-zero when bit 24 (0x1000000) of addr is clear.
// addr is parenthesized so that expression arguments such as (a | b) are
// masked as a whole.
// NOTE(review): the name suggests bit 24 selects between two VRAM address areas -- confirm.
#define Is_64_Bit(addr) (((addr) & 0x1000000)==0)
|
|
|
|
//vram_block and vramLockCBFP are declared in the plugin headers
|
|
|
|
|
|
u32 vramlock_ConvAddrtoOffset64(u32 Address);
|
|
u32 vramlock_ConvOffset32toOffset64(u32 offset32);
|
|
|
|
void vramlock_Unlock_block(vram_block* block);
|
|
vram_block* vramlock_Lock_32(u32 start_offset32,u32 end_offset32,void* userdata);
|
|
vram_block* vramlock_Lock_64(u32 start_offset64,u32 end_offset64,void* userdata);
|
|
|
|
void vram_LockedWrite(u32 offset64); |