2010-04-25 00:31:27 +00:00
|
|
|
/*
|
2010-04-24 21:37:39 +00:00
|
|
|
* Copyright (C) 2007-2009 Gabest
|
|
|
|
* http://www.gabest.org
|
|
|
|
*
|
|
|
|
* This Program is free software; you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation; either version 2, or (at your option)
|
|
|
|
* any later version.
|
2010-04-25 00:31:27 +00:00
|
|
|
*
|
2010-04-24 21:37:39 +00:00
|
|
|
* This Program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
2010-04-25 00:31:27 +00:00
|
|
|
*
|
2010-04-24 21:37:39 +00:00
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with GNU Make; see the file COPYING. If not, write to
|
2012-09-09 18:16:11 +00:00
|
|
|
* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
2010-04-24 21:37:39 +00:00
|
|
|
* http://www.gnu.org/copyleft/gpl.html
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include "GSScanlineEnvironment.h"
|
2018-11-16 18:41:37 +00:00
|
|
|
#include "Renderers/Common/GSFunctionMap.h"
|
2016-11-19 13:17:38 +00:00
|
|
|
#include "GSUtil.h"
|
2010-04-24 21:37:39 +00:00
|
|
|
|
|
|
|
// Makes the names of namespace Xbyak visible unqualified for the rest of this
// header. The declarations below spell Xmm, Ymm, Reg8, Reg32 and Operand (and
// the Reg32/Reg64 expansion of RegLong) without qualification -- presumably
// these are all Xbyak types.
// NOTE(review): a using-directive at header scope also applies to every file
// that includes this header; removing it would require qualifying those names.
using namespace Xbyak;
|
|
|
|
|
2016-11-19 13:47:40 +00:00
|
|
|
// RegLong: register type used for the `addr` operands of the pixel read/write
// helpers declared in this header.
//   - _M_AMD64 or _WIN64 defined : RegLong expands to Reg64
//   - otherwise                  : RegLong expands to Reg32
// NOTE(review): Reg64/Reg32 are written unqualified, so the expansion relies on
// those names being visible at every point where RegLong is used.
#if defined(_M_AMD64) || defined(_WIN64)
#define RegLong Reg64
#else
#define RegLong Reg32
#endif
|
|
|
|
|
2011-02-16 03:19:36 +00:00
|
|
|
class GSDrawScanlineCodeGenerator : public GSCodeGenerator
|
2010-04-24 21:37:39 +00:00
|
|
|
{
|
|
|
|
void operator = (const GSDrawScanlineCodeGenerator&);
|
|
|
|
|
|
|
|
GSScanlineSelector m_sel;
|
2011-02-17 03:24:37 +00:00
|
|
|
GSScanlineLocalData& m_local;
|
2016-11-20 16:29:11 +00:00
|
|
|
bool m_rip;
|
2010-04-24 21:37:39 +00:00
|
|
|
|
|
|
|
void Generate();
|
|
|
|
|
2013-06-20 05:07:52 +00:00
|
|
|
#if _M_SSE >= 0x501
|
|
|
|
|
|
|
|
void Init();
|
|
|
|
void Step();
|
|
|
|
void TestZ(const Ymm& temp1, const Ymm& temp2);
|
|
|
|
void SampleTexture();
|
|
|
|
void Wrap(const Ymm& uv0);
|
|
|
|
void Wrap(const Ymm& uv0, const Ymm& uv1);
|
|
|
|
void SampleTextureLOD();
|
|
|
|
void WrapLOD(const Ymm& uv0);
|
|
|
|
void WrapLOD(const Ymm& uv0, const Ymm& uv1);
|
|
|
|
void AlphaTFX();
|
|
|
|
void ReadMask();
|
|
|
|
void TestAlpha();
|
|
|
|
void ColorTFX();
|
|
|
|
void Fog();
|
|
|
|
void ReadFrame();
|
|
|
|
void TestDestAlpha();
|
|
|
|
void WriteMask();
|
|
|
|
void WriteZBuf();
|
|
|
|
void AlphaBlend();
|
|
|
|
void WriteFrame();
|
2016-11-19 13:47:40 +00:00
|
|
|
void ReadPixel(const Ymm& dst, const Ymm& temp, const RegLong& addr);
|
|
|
|
void WritePixel(const Ymm& src, const Ymm& temp, const RegLong& addr, const Reg32& mask, bool fast, int psm, int fz);
|
|
|
|
void WritePixel(const Xmm& src, const RegLong& addr, uint8 i, uint8 j, int psm);
|
2013-06-20 05:07:52 +00:00
|
|
|
void ReadTexel(int pixels, int mip_offset = 0);
|
|
|
|
void ReadTexel(const Ymm& dst, const Ymm& addr, uint8 i);
|
|
|
|
|
|
|
|
#else
|
|
|
|
|
2016-11-19 13:47:40 +00:00
|
|
|
void Generate_SSE();
|
|
|
|
void Init_SSE();
|
|
|
|
void Step_SSE();
|
|
|
|
void TestZ_SSE(const Xmm& temp1, const Xmm& temp2);
|
|
|
|
void SampleTexture_SSE();
|
|
|
|
void Wrap_SSE(const Xmm& uv0);
|
|
|
|
void Wrap_SSE(const Xmm& uv0, const Xmm& uv1);
|
|
|
|
void SampleTextureLOD_SSE();
|
|
|
|
void WrapLOD_SSE(const Xmm& uv0);
|
|
|
|
void WrapLOD_SSE(const Xmm& uv0, const Xmm& uv1);
|
|
|
|
void AlphaTFX_SSE();
|
|
|
|
void ReadMask_SSE();
|
|
|
|
void TestAlpha_SSE();
|
|
|
|
void ColorTFX_SSE();
|
|
|
|
void Fog_SSE();
|
|
|
|
void ReadFrame_SSE();
|
|
|
|
void TestDestAlpha_SSE();
|
|
|
|
void WriteMask_SSE();
|
|
|
|
void WriteZBuf_SSE();
|
|
|
|
void AlphaBlend_SSE();
|
|
|
|
void WriteFrame_SSE();
|
|
|
|
void ReadPixel_SSE(const Xmm& dst, const RegLong& addr);
|
|
|
|
void WritePixel_SSE(const Xmm& src, const RegLong& addr, const Reg8& mask, bool fast, int psm, int fz);
|
|
|
|
void WritePixel_SSE(const Xmm& src, const RegLong& addr, uint8 i, int psm);
|
|
|
|
void ReadTexel_SSE(int pixels, int mip_offset = 0);
|
|
|
|
void ReadTexel_SSE(const Xmm& dst, const Xmm& addr, uint8 i);
|
|
|
|
|
|
|
|
void Generate_AVX();
|
|
|
|
void Init_AVX();
|
|
|
|
void Step_AVX();
|
|
|
|
void TestZ_AVX(const Xmm& temp1, const Xmm& temp2);
|
|
|
|
void SampleTexture_AVX();
|
|
|
|
void Wrap_AVX(const Xmm& uv0);
|
|
|
|
void Wrap_AVX(const Xmm& uv0, const Xmm& uv1);
|
|
|
|
void SampleTextureLOD_AVX();
|
|
|
|
void WrapLOD_AVX(const Xmm& uv0);
|
|
|
|
void WrapLOD_AVX(const Xmm& uv0, const Xmm& uv1);
|
|
|
|
void AlphaTFX_AVX();
|
|
|
|
void ReadMask_AVX();
|
|
|
|
void TestAlpha_AVX();
|
|
|
|
void ColorTFX_AVX();
|
|
|
|
void Fog_AVX();
|
|
|
|
void ReadFrame_AVX();
|
|
|
|
void TestDestAlpha_AVX();
|
|
|
|
void WriteMask_AVX();
|
|
|
|
void WriteZBuf_AVX();
|
|
|
|
void AlphaBlend_AVX();
|
|
|
|
void WriteFrame_AVX();
|
|
|
|
void ReadPixel_AVX(const Xmm& dst, const RegLong& addr);
|
|
|
|
void WritePixel_AVX(const Xmm& src, const RegLong& addr, const Reg8& mask, bool fast, int psm, int fz);
|
|
|
|
void WritePixel_AVX(const Xmm& src, const RegLong& addr, uint8 i, int psm);
|
|
|
|
void ReadTexel_AVX(int pixels, int mip_offset = 0);
|
|
|
|
void ReadTexel_AVX(const Xmm& dst, const Xmm& addr, uint8 i);
|
2010-04-24 21:37:39 +00:00
|
|
|
|
2016-11-22 06:43:02 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
void modulate16(const Xmm& a, const Operand& f, uint8 shift);
|
|
|
|
void lerp16(const Xmm& a, const Xmm& b, const Xmm& f, uint8 shift);
|
2012-02-12 17:56:06 +00:00
|
|
|
void lerp16_4(const Xmm& a, const Xmm& b, const Xmm& f);
|
2010-04-24 21:37:39 +00:00
|
|
|
void mix16(const Xmm& a, const Xmm& b, const Xmm& temp);
|
|
|
|
void clamp16(const Xmm& a, const Xmm& temp);
|
2016-11-22 06:43:02 +00:00
|
|
|
void alltrue(const Xmm& test);
|
2010-04-24 21:37:39 +00:00
|
|
|
void blend(const Xmm& a, const Xmm& b, const Xmm& mask);
|
|
|
|
void blendr(const Xmm& b, const Xmm& a, const Xmm& mask);
|
2011-02-07 01:59:05 +00:00
|
|
|
void blend8(const Xmm& a, const Xmm& b);
|
|
|
|
void blend8r(const Xmm& b, const Xmm& a);
|
2016-11-18 21:48:06 +00:00
|
|
|
void split16_2x8(const Xmm& l, const Xmm& h, const Xmm& src);
|
2010-04-24 21:37:39 +00:00
|
|
|
|
|
|
|
public:
|
2011-02-16 03:19:36 +00:00
|
|
|
GSDrawScanlineCodeGenerator(void* param, uint64 key, void* code, size_t maxsize);
|
2010-04-25 00:31:27 +00:00
|
|
|
};
|