724 lines
15 KiB
C
724 lines
15 KiB
C
/*
|
|
* Glide64 - Glide video plugin for Nintendo 64 emulators.
|
|
* Copyright (c) 2002 Dave2001
|
|
* Copyright (c) 2003-2009 Sergey 'Gonetz' Lipski
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
*/
|
|
|
|
//****************************************************************
|
|
//
|
|
// Glide64 - Glide Plugin for Nintendo 64 emulators
|
|
// Project started on December 29th, 2001
|
|
//
|
|
// Authors:
|
|
// Dave2001, original author, founded the project in 2001, left it in 2002
|
|
// Gugaman, joined the project in 2002, left it in 2002
|
|
// Sergey 'Gonetz' Lipski, joined the project in 2002, main author since fall of 2002
|
|
// Hiroshi 'KoolSmoky' Morii, joined the project in 2007
|
|
//
|
|
//****************************************************************
|
|
//
|
|
// To modify Glide64:
|
|
// * Write your name and (optional)email, commented by your work, so I know who did it, and so that you can find which parts you modified when it comes time to send it to me.
|
|
// * Do NOT send me the whole project or file that you modified. Take out your modified code sections, and tell me where to put them. If people sent the whole thing, I would have many different versions, but no idea how to combine them all.
|
|
//
|
|
//****************************************************************
|
|
|
|
extern "C" void __declspec(naked) asmLoad8bCI (wxUIntPtr src, wxUIntPtr dst, int wid_64, int height, int line, int ext, wxUIntPtr pal)
|
|
{
|
|
_asm {
|
|
push ebp
|
|
mov ebp, esp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
|
|
mov ebx,[pal]
|
|
mov esi,[src]
|
|
mov edi,[dst]
|
|
mov ecx,[height]
|
|
y_loop:
|
|
push ecx
|
|
mov ecx,[wid_64]
|
|
x_loop:
|
|
push ecx
|
|
|
|
mov eax,[esi] // read all 4 pixels
|
|
bswap eax
|
|
add esi,4
|
|
mov edx,eax
|
|
|
|
// 1st dword output {
|
|
shr eax,15
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
shl ecx,16
|
|
|
|
mov eax,edx
|
|
shr eax,23
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// 2nd dword output {
|
|
mov eax,edx
|
|
shl eax,1
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
shl ecx,16
|
|
|
|
shr edx,7
|
|
and edx,0x1FE
|
|
mov cx,[ebx+edx]
|
|
ror cx,1
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// * copy
|
|
mov eax,[esi] // read all 4 pixels
|
|
bswap eax
|
|
add esi,4
|
|
mov edx,eax
|
|
|
|
// 1st dword output {
|
|
shr eax,15
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
shl ecx,16
|
|
|
|
mov eax,edx
|
|
shr eax,23
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// 2nd dword output {
|
|
mov eax,edx
|
|
shl eax,1
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
shl ecx,16
|
|
|
|
shr edx,7
|
|
and edx,0x1FE
|
|
mov cx,[ebx+edx]
|
|
ror cx,1
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
// *
|
|
|
|
pop ecx
|
|
|
|
dec ecx
|
|
jnz x_loop
|
|
|
|
pop ecx
|
|
dec ecx
|
|
jz near end_y_loop
|
|
push ecx
|
|
|
|
mov eax,esi
|
|
add eax,[line]
|
|
mov esi,[src]
|
|
sub eax,esi
|
|
and eax,0x7FF
|
|
add esi,eax
|
|
add edi,[ext]
|
|
|
|
mov ecx,[wid_64]
|
|
x_loop_2:
|
|
push ecx
|
|
|
|
mov eax,[esi+4] // read all 4 pixels
|
|
bswap eax
|
|
mov edx,eax
|
|
|
|
// 1st dword output {
|
|
shr eax,15
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
shl ecx,16
|
|
|
|
mov eax,edx
|
|
shr eax,23
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// 2nd dword output {
|
|
mov eax,edx
|
|
shl eax,1
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
shl ecx,16
|
|
|
|
shr edx,7
|
|
and edx,0x1FE
|
|
mov cx,[ebx+edx]
|
|
ror cx,1
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// * copy
|
|
mov eax,[esi] // read all 4 pixels
|
|
bswap eax
|
|
mov edx,esi
|
|
add edx,8
|
|
mov esi,[src]
|
|
sub edx,esi
|
|
and edx,0x7FF
|
|
add esi,edx
|
|
mov edx,eax
|
|
|
|
// 1st dword output {
|
|
shr eax,15
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
shl ecx,16
|
|
|
|
mov eax,edx
|
|
shr eax,23
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// 2nd dword output {
|
|
mov eax,edx
|
|
shl eax,1
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,1
|
|
shl ecx,16
|
|
|
|
shr edx,7
|
|
and edx,0x1FE
|
|
mov cx,[ebx+edx]
|
|
ror cx,1
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
// *
|
|
|
|
pop ecx
|
|
|
|
dec ecx
|
|
jnz x_loop_2
|
|
|
|
mov eax,esi
|
|
add eax,[line]
|
|
mov esi,[src]
|
|
sub eax,esi
|
|
and eax,0x7FF
|
|
add esi,eax
|
|
add edi,[ext]
|
|
|
|
pop ecx
|
|
dec ecx
|
|
jnz y_loop
|
|
|
|
end_y_loop:
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
mov esp, ebp
|
|
pop ebp
|
|
ret
|
|
}
|
|
}
|
|
|
|
extern "C" void __declspec(naked) asmLoad8bIA8 (wxUIntPtr src, wxUIntPtr dst, int wid_64, int height, int line, int ext, wxUIntPtr pal)
|
|
{
|
|
_asm {
|
|
push ebp
|
|
mov ebp, esp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
|
|
mov ebx,[pal]
|
|
mov esi,[src]
|
|
mov edi,[dst]
|
|
mov ecx,[height]
|
|
y_loop:
|
|
push ecx
|
|
mov ecx,[wid_64]
|
|
x_loop:
|
|
push ecx
|
|
|
|
mov eax,[esi] // read all 4 pixels
|
|
bswap eax
|
|
add esi,4
|
|
mov edx,eax
|
|
|
|
// 1st dword output {
|
|
shr eax,15
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
shl ecx,16
|
|
|
|
mov eax,edx
|
|
shr eax,23
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// 2nd dword output {
|
|
mov eax,edx
|
|
shl eax,1
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
shl ecx,16
|
|
|
|
shr edx,7
|
|
and edx,0x1FE
|
|
mov cx,[ebx+edx]
|
|
ror cx,8
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// * copy
|
|
mov eax,[esi] // read all 4 pixels
|
|
bswap eax
|
|
add esi,4
|
|
mov edx,eax
|
|
|
|
// 1st dword output {
|
|
shr eax,15
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
shl ecx,16
|
|
|
|
mov eax,edx
|
|
shr eax,23
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// 2nd dword output {
|
|
mov eax,edx
|
|
shl eax,1
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
shl ecx,16
|
|
|
|
shr edx,7
|
|
and edx,0x1FE
|
|
mov cx,[ebx+edx]
|
|
ror cx,8
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
// *
|
|
|
|
pop ecx
|
|
|
|
dec ecx
|
|
jnz x_loop
|
|
|
|
pop ecx
|
|
dec ecx
|
|
jz near end_y_loop
|
|
push ecx
|
|
|
|
add esi,[line]
|
|
add edi,[ext]
|
|
|
|
mov ecx,[wid_64]
|
|
x_loop_2:
|
|
push ecx
|
|
|
|
mov eax,[esi+4] // read all 4 pixels
|
|
bswap eax
|
|
mov edx,eax
|
|
|
|
// 1st dword output {
|
|
shr eax,15
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
shl ecx,16
|
|
|
|
mov eax,edx
|
|
shr eax,23
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// 2nd dword output {
|
|
mov eax,edx
|
|
shl eax,1
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
shl ecx,16
|
|
|
|
shr edx,7
|
|
and edx,0x1FE
|
|
mov cx,[ebx+edx]
|
|
ror cx,8
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// * copy
|
|
mov eax,[esi] // read all 4 pixels
|
|
bswap eax
|
|
add esi,8
|
|
mov edx,eax
|
|
|
|
// 1st dword output {
|
|
shr eax,15
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
shl ecx,16
|
|
|
|
mov eax,edx
|
|
shr eax,23
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
|
|
// 2nd dword output {
|
|
mov eax,edx
|
|
shl eax,1
|
|
and eax,0x1FE
|
|
mov cx,[ebx+eax]
|
|
ror cx,8
|
|
shl ecx,16
|
|
|
|
shr edx,7
|
|
and edx,0x1FE
|
|
mov cx,[ebx+edx]
|
|
ror cx,8
|
|
|
|
mov [edi],ecx
|
|
add edi,4
|
|
// }
|
|
// *
|
|
|
|
pop ecx
|
|
|
|
dec ecx
|
|
jnz x_loop_2
|
|
|
|
add esi,[line]
|
|
add edi,[ext]
|
|
|
|
pop ecx
|
|
dec ecx
|
|
jnz y_loop
|
|
|
|
end_y_loop:
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
mov esp, ebp
|
|
pop ebp
|
|
ret
|
|
}
|
|
}
|
|
|
|
extern "C" void __declspec(naked) asmLoad8bIA4 (wxUIntPtr src, wxUIntPtr dst, int wid_64, int height, int line, int ext)
|
|
{
|
|
_asm {
|
|
push ebp
|
|
mov ebp, esp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
|
|
mov esi,[src]
|
|
mov edi,[dst]
|
|
mov ecx,[height]
|
|
y_loop:
|
|
push ecx
|
|
mov ecx,[wid_64]
|
|
x_loop:
|
|
mov eax,[esi] // read all 4 pixels
|
|
mov edx,eax
|
|
|
|
shr eax,4 //all alpha
|
|
shl edx,4
|
|
and eax,0x0F0F0F0F
|
|
and edx,0xF0F0F0F0
|
|
add esi,4
|
|
or eax,edx
|
|
|
|
mov [edi],eax // save dword
|
|
add edi,4
|
|
|
|
mov eax,[esi] // read all 4 pixels
|
|
mov edx,eax
|
|
|
|
shr eax,4 //all alpha
|
|
shl edx,4
|
|
and eax,0x0F0F0F0F
|
|
and edx,0xF0F0F0F0
|
|
add esi,4
|
|
or eax,edx
|
|
|
|
mov [edi],eax // save dword
|
|
add edi,4
|
|
// *
|
|
|
|
dec ecx
|
|
jnz x_loop
|
|
|
|
pop ecx
|
|
dec ecx
|
|
jz end_y_loop
|
|
push ecx
|
|
|
|
add esi,[line]
|
|
add edi,[ext]
|
|
|
|
mov ecx,[wid_64]
|
|
x_loop_2:
|
|
mov eax,[esi+4] // read both pixels
|
|
mov edx,eax
|
|
|
|
shr eax,4 //all alpha
|
|
shl edx,4
|
|
and eax,0x0F0F0F0F
|
|
and edx,0xF0F0F0F0
|
|
or eax,edx
|
|
|
|
mov [edi],eax //save dword
|
|
add edi,4
|
|
|
|
mov eax,[esi] // read both pixels
|
|
add esi,8
|
|
mov edx,eax
|
|
|
|
shr eax,4 //all alpha
|
|
shl edx,4
|
|
and eax,0x0F0F0F0F
|
|
and edx,0xF0F0F0F0
|
|
or eax,edx
|
|
|
|
mov [edi],eax //save dword
|
|
add edi,4
|
|
// *
|
|
|
|
dec ecx
|
|
jnz x_loop_2
|
|
|
|
add esi,[line]
|
|
add edi,[ext]
|
|
|
|
pop ecx
|
|
dec ecx
|
|
jnz y_loop
|
|
|
|
end_y_loop:
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
mov esp, ebp
|
|
pop ebp
|
|
ret
|
|
}
|
|
}
|
|
|
|
extern "C" void __declspec(naked) asmLoad8bI (wxUIntPtr src, int dst, wxUIntPtr wid_64, int height, int line, int ext)
|
|
{
|
|
_asm {
|
|
push ebp
|
|
mov ebp, esp
|
|
push ebx
|
|
push esi
|
|
push edi
|
|
|
|
mov esi,[src]
|
|
mov edi,[dst]
|
|
mov ecx,[height]
|
|
y_loop:
|
|
push ecx
|
|
mov ecx,[wid_64]
|
|
x_loop:
|
|
mov eax,[esi] // read all 4 pixels
|
|
add esi,4
|
|
|
|
mov [edi],eax // save dword
|
|
add edi,4
|
|
|
|
mov eax,[esi] // read all 4 pixels
|
|
add esi,4
|
|
|
|
mov [edi],eax // save dword
|
|
add edi,4
|
|
// *
|
|
|
|
dec ecx
|
|
jnz x_loop
|
|
|
|
pop ecx
|
|
dec ecx
|
|
jz end_y_loop
|
|
push ecx
|
|
|
|
add esi,[line]
|
|
add edi,[ext]
|
|
|
|
mov ecx,[wid_64]
|
|
x_loop_2:
|
|
mov eax,[esi+4] // read both pixels
|
|
|
|
mov [edi],eax //save dword
|
|
add edi,4
|
|
|
|
mov eax,[esi] // read both pixels
|
|
add esi,8
|
|
|
|
mov [edi],eax //save dword
|
|
add edi,4
|
|
// *
|
|
|
|
dec ecx
|
|
jnz x_loop_2
|
|
|
|
add esi,[line]
|
|
add edi,[ext]
|
|
|
|
pop ecx
|
|
dec ecx
|
|
jnz y_loop
|
|
|
|
end_y_loop:
|
|
pop edi
|
|
pop esi
|
|
pop ebx
|
|
mov esp, ebp
|
|
pop ebp
|
|
ret
|
|
}
|
|
}
|
|
|
|
//****************************************************************
|
|
// Size: 1, Format: 2
|
|
//
|
|
|
|
wxUint32 Load8bCI (wxUIntPtr dst, wxUIntPtr src, int wid_64, int height, int line, int real_width, int /*tile*/)
|
|
{
|
|
if (wid_64 < 1) wid_64 = 1;
|
|
if (height < 1) height = 1;
|
|
int ext = (real_width - (wid_64 << 3));
|
|
wxUIntPtr pal = wxPtrToUInt(rdp.pal_8);
|
|
|
|
switch (rdp.tlut_mode) {
|
|
case 0: //palette is not used
|
|
//in tlut DISABLE mode load CI texture as plain intensity texture instead of palette dereference.
|
|
//Thanks to angrylion for the advice
|
|
asmLoad8bI (src, dst, wid_64, height, line, ext);
|
|
return /*(0 << 16) | */GR_TEXFMT_ALPHA_8;
|
|
case 2: //color palette
|
|
ext <<= 1;
|
|
asmLoad8bCI (src, dst, wid_64, height, line, ext, pal);
|
|
return (1 << 16) | GR_TEXFMT_ARGB_1555;
|
|
default: //IA palette
|
|
ext <<= 1;
|
|
asmLoad8bIA8 (src, dst, wid_64, height, line, ext, pal);
|
|
return (1 << 16) | GR_TEXFMT_ALPHA_INTENSITY_88;
|
|
}
|
|
}
|
|
|
|
//****************************************************************
|
|
// Size: 1, Format: 3
|
|
//
|
|
|
|
wxUint32 Load8bIA (wxUIntPtr dst, wxUIntPtr src, int wid_64, int height, int line, int real_width, int tile)
|
|
{
|
|
if (rdp.tlut_mode != 0)
|
|
return Load8bCI (dst, src, wid_64, height, line, real_width, tile);
|
|
|
|
if (wid_64 < 1) wid_64 = 1;
|
|
if (height < 1) height = 1;
|
|
int ext = (real_width - (wid_64 << 3));
|
|
asmLoad8bIA4 (src, dst, wid_64, height, line, ext);
|
|
return /*(0 << 16) | */GR_TEXFMT_ALPHA_INTENSITY_44;
|
|
}
|
|
|
|
//****************************************************************
|
|
// Size: 1, Format: 4
|
|
//
|
|
|
|
wxUint32 Load8bI (wxUIntPtr dst, wxUIntPtr src, int wid_64, int height, int line, int real_width, int tile)
|
|
{
|
|
if (rdp.tlut_mode != 0)
|
|
return Load8bCI (dst, src, wid_64, height, line, real_width, tile);
|
|
|
|
if (wid_64 < 1) wid_64 = 1;
|
|
if (height < 1) height = 1;
|
|
int ext = (real_width - (wid_64 << 3));
|
|
asmLoad8bI (src, dst, wid_64, height, line, ext);
|
|
return /*(0 << 16) | */GR_TEXFMT_ALPHA_8;
|
|
}
|