mirror of https://github.com/PCSX2/pcsx2.git
175 lines
9.7 KiB
C
175 lines
9.7 KiB
C
|
/* ZZ Open GL graphics plugin
|
||
|
* Copyright (c)2009-2010 zeydlitz@gmail.com, arcum42@gmail.com
|
||
|
* Based on Zerofrog's ZeroGS KOSMOS (c)2005-2008
|
||
|
*
|
||
|
* This program is free software; you can redistribute it and/or modify
|
||
|
* it under the terms of the GNU General Public License as published by
|
||
|
* the Free Software Foundation; either version 2 of the License, or
|
||
|
* (at your option) any later version.
|
||
|
*
|
||
|
* This program is distributed in the hope that it will be useful,
|
||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
* GNU General Public License for more details.
|
||
|
*
|
||
|
* You should have received a copy of the GNU General Public License
|
||
|
* along with this program; if not, write to the Free Software
|
||
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
|
||
|
*/
|
||
|
|
||
|
#ifndef ZEROGS_X86
|
||
|
#define ZEROGS_X86
|
||
|
|
||
|
#include "GS.h"
|
||
|
|
||
|
extern "C" void __fastcall SwizzleBlock32_sse2(u8* dst, u8* src, int srcpitch, u32 WriteMask = 0xffffffff);
|
||
|
extern "C" void __fastcall SwizzleBlock16_sse2(u8* dst, u8* src, int srcpitch);
|
||
|
extern "C" void __fastcall SwizzleBlock8_sse2(u8* dst, u8* src, int srcpitch);
|
||
|
extern "C" void __fastcall SwizzleBlock4_sse2(u8* dst, u8* src, int srcpitch);
|
||
|
extern "C" void __fastcall SwizzleBlock32u_sse2(u8* dst, u8* src, int srcpitch, u32 WriteMask = 0xffffffff);
|
||
|
extern "C" void __fastcall SwizzleBlock16u_sse2(u8* dst, u8* src, int srcpitch);
|
||
|
extern "C" void __fastcall SwizzleBlock8u_sse2(u8* dst, u8* src, int srcpitch);
|
||
|
extern "C" void __fastcall SwizzleBlock4u_sse2(u8* dst, u8* src, int srcpitch);
|
||
|
|
||
|
// frame swizzling
|
||
|
|
||
|
#if 0
|
||
|
// no AA
|
||
|
extern "C" void __fastcall FrameSwizzleBlock32_sse2(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall FrameSwizzleBlock16_sse2(u16* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock32_sse2(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock32Z_sse2(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock16_sse2(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock16Z_sse2(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
|
||
|
// AA 2x
|
||
|
extern "C" void __fastcall FrameSwizzleBlock32A2_sse2(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall FrameSwizzleBlock16A2_sse2(u16* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock32A2_sse2(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock32ZA2_sse2(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock16A2_sse2(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock16ZA2_sse2(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
|
||
|
// AA 4x
|
||
|
extern "C" void __fastcall FrameSwizzleBlock32A4_sse2(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall FrameSwizzleBlock16A4_sse2(u16* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock32A4_sse2(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock32ZA4_sse2(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock16A4_sse2(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern "C" void __fastcall Frame16SwizzleBlock16ZA4_sse2(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
|
||
|
/*extern void __fastcall SwizzleBlock32_c(u8* dst, u8* src, int srcpitch, u32 WriteMask = 0xffffffff);
|
||
|
extern void __fastcall SwizzleBlock16_c(u8* dst, u8* src, int srcpitch);
|
||
|
extern void __fastcall SwizzleBlock8_c(u8* dst, u8* src, int srcpitch);
|
||
|
extern void __fastcall SwizzleBlock4_c(u8* dst, u8* src, int srcpitch);*/
|
||
|
|
||
|
// no AA
|
||
|
extern void __fastcall FrameSwizzleBlock32_c(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall FrameSwizzleBlock24_c(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall FrameSwizzleBlock16_c(u16* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock32_c(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock32Z_c(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock16_c(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock16Z_c(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
|
||
|
// AA 2x
|
||
|
extern void __fastcall FrameSwizzleBlock32A2_c(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall FrameSwizzleBlock24A2_c(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall FrameSwizzleBlock16A2_c(u16* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock32A2_c(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock32ZA2_c(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock16A2_c(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock16ZA2_c(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
|
||
|
// AA 4x
|
||
|
extern void __fastcall FrameSwizzleBlock32A4_c(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall FrameSwizzleBlock24A4_c(u32* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall FrameSwizzleBlock16A4_c(u16* dst, u32* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock32A4_c(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock32ZA4_c(u32* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock16A4_c(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
extern void __fastcall Frame16SwizzleBlock16ZA4_c(u16* dst, Vector_16F* src, int srcpitch, u32 WriteMask);
|
||
|
#endif
|
||
|
|
||
|
extern void __fastcall SwizzleColumn32_c(int y, u8* dst, u8* src, int srcpitch, u32 WriteMask = 0xffffffff);
|
||
|
extern void __fastcall SwizzleColumn16_c(int y, u8* dst, u8* src, int srcpitch);
|
||
|
extern void __fastcall SwizzleColumn8_c(int y, u8* dst, u8* src, int srcpitch);
|
||
|
extern void __fastcall SwizzleColumn4_c(int y, u8* dst, u8* src, int srcpitch);
|
||
|
|
||
|
// extern "C" void __fastcall WriteCLUT_T16_I8_CSM1_sse2(u32* vm, u32* clut);
|
||
|
extern "C" void __fastcall WriteCLUT_T16_I8_CSM1_sse2(u32* vm, u32 csa);
|
||
|
extern "C" void __fastcall WriteCLUT_T32_I8_CSM1_sse2(u32* vm, u32* clut);
|
||
|
// extern "C" void __fastcall WriteCLUT_T16_I4_CSM1_sse2(u32* vm, u32* clut);
|
||
|
extern "C" void __fastcall WriteCLUT_T16_I4_CSM1_sse2(u32* vm, u32 csa);
|
||
|
extern "C" void __fastcall WriteCLUT_T32_I4_CSM1_sse2(u32* vm, u32* clut);
|
||
|
extern void __fastcall WriteCLUT_T16_I8_CSM1_c(u32* vm, u32* clut);
|
||
|
extern void __fastcall WriteCLUT_T32_I8_CSM1_c(u32* vm, u32* clut);
|
||
|
|
||
|
extern void __fastcall WriteCLUT_T16_I4_CSM1_c(u32* vm, u32* clut);
|
||
|
extern void __fastcall WriteCLUT_T32_I4_CSM1_c(u32* vm, u32* clut);
|
||
|
|
||
|
extern void SSE2_UnswizzleZ16Target(u16* dst, u16* src, int iters);
|
||
|
|
||
|
#ifdef ZEROGS_SSE2
|
||
|
|
||
|
#define FrameSwizzleBlock32 FrameSwizzleBlock32_c
|
||
|
#define FrameSwizzleBlock24 FrameSwizzleBlock24_c
|
||
|
#define FrameSwizzleBlock16 FrameSwizzleBlock16_c
|
||
|
#define Frame16SwizzleBlock32 Frame16SwizzleBlock32_c
|
||
|
#define Frame16SwizzleBlock32Z Frame16SwizzleBlock32Z_c
|
||
|
#define Frame16SwizzleBlock16 Frame16SwizzleBlock16_c
|
||
|
#define Frame16SwizzleBlock16Z Frame16SwizzleBlock16Z_c
|
||
|
|
||
|
#define FrameSwizzleBlock32A2 FrameSwizzleBlock32A2_c
|
||
|
#define FrameSwizzleBlock24A2 FrameSwizzleBlock24A2_c
|
||
|
#define FrameSwizzleBlock16A2 FrameSwizzleBlock16A2_c
|
||
|
#define Frame16SwizzleBlock32A2 Frame16SwizzleBlock32A2_c
|
||
|
#define Frame16SwizzleBlock32ZA2 Frame16SwizzleBlock32ZA2_c
|
||
|
#define Frame16SwizzleBlock16A2 Frame16SwizzleBlock16A2_c
|
||
|
#define Frame16SwizzleBlock16ZA2 Frame16SwizzleBlock16ZA2_c
|
||
|
|
||
|
#define FrameSwizzleBlock32A4 FrameSwizzleBlock32A4_c
|
||
|
#define FrameSwizzleBlock24A4 FrameSwizzleBlock24A4_c
|
||
|
#define FrameSwizzleBlock16A4 FrameSwizzleBlock16A4_c
|
||
|
#define Frame16SwizzleBlock32A4 Frame16SwizzleBlock32A4_c
|
||
|
#define Frame16SwizzleBlock32ZA4 Frame16SwizzleBlock32ZA4_c
|
||
|
#define Frame16SwizzleBlock16A4 Frame16SwizzleBlock16A4_c
|
||
|
#define Frame16SwizzleBlock16ZA4 Frame16SwizzleBlock16ZA4_c
|
||
|
|
||
|
#define WriteCLUT_T16_I8_CSM1 WriteCLUT_T16_I8_CSM1_sse2
|
||
|
#define WriteCLUT_T32_I8_CSM1 WriteCLUT_T32_I8_CSM1_sse2
|
||
|
#define WriteCLUT_T16_I4_CSM1 WriteCLUT_T16_I4_CSM1_sse2
|
||
|
#define WriteCLUT_T32_I4_CSM1 WriteCLUT_T32_I4_CSM1_sse2
|
||
|
|
||
|
#else
|
||
|
|
||
|
#define FrameSwizzleBlock32 FrameSwizzleBlock32_c
|
||
|
#define FrameSwizzleBlock16 FrameSwizzleBlock16_c
|
||
|
#define Frame16SwizzleBlock32 Frame16SwizzleBlock32_c
|
||
|
#define Frame16SwizzleBlock32Z Frame16SwizzleBlock32Z_c
|
||
|
#define Frame16SwizzleBlock16 Frame16SwizzleBlock16_c
|
||
|
#define Frame16SwizzleBlock16Z Frame16SwizzleBlock16Z_c
|
||
|
|
||
|
#define FrameSwizzleBlock32A2 FrameSwizzleBlock32A2_c
|
||
|
#define FrameSwizzleBlock16A2 FrameSwizzleBlock16A2_c
|
||
|
#define Frame16SwizzleBlock32A2 Frame16SwizzleBlock32A2_c
|
||
|
#define Frame16SwizzleBlock32ZA2 Frame16SwizzleBlock32ZA2_c
|
||
|
#define Frame16SwizzleBlock16A2 Frame16SwizzleBlock16A2_c
|
||
|
#define Frame16SwizzleBlock16ZA2 Frame16SwizzleBlock16ZA2_c
|
||
|
|
||
|
#define FrameSwizzleBlock32A4 FrameSwizzleBlock32A4_c
|
||
|
#define FrameSwizzleBlock16A4 FrameSwizzleBlock16A4_c
|
||
|
#define Frame16SwizzleBlock32A4 Frame16SwizzleBlock32A4_c
|
||
|
#define Frame16SwizzleBlock32ZA4 Frame16SwizzleBlock32ZA4_c
|
||
|
#define Frame16SwizzleBlock16A4 Frame16SwizzleBlock16A4_c
|
||
|
#define Frame16SwizzleBlock16ZA4 Frame16SwizzleBlock16ZA4_c
|
||
|
|
||
|
#define WriteCLUT_T16_I8_CSM1 WriteCLUT_T16_I8_CSM1_c
|
||
|
#define WriteCLUT_T32_I8_CSM1 WriteCLUT_T32_I8_CSM1_c
|
||
|
#define WriteCLUT_T16_I4_CSM1 WriteCLUT_T16_I4_CSM1_c
|
||
|
#define WriteCLUT_T32_I4_CSM1 WriteCLUT_T32_I4_CSM1_c
|
||
|
|
||
|
#endif
|
||
|
|
||
|
#endif
|