2010-04-25 00:31:27 +00:00
|
|
|
/*
|
2009-06-27 03:32:33 +00:00
|
|
|
* Copyright (C) 2007-2009 Gabest
|
|
|
|
* http://www.gabest.org
|
|
|
|
*
|
|
|
|
* This Program is free software; you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation; either version 2, or (at your option)
|
|
|
|
* any later version.
|
2010-04-25 00:31:27 +00:00
|
|
|
*
|
2009-06-27 03:32:33 +00:00
|
|
|
* This Program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
2010-04-25 00:31:27 +00:00
|
|
|
*
|
2009-06-27 03:32:33 +00:00
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with GNU Make; see the file COPYING. If not, write to
|
2012-09-09 18:16:11 +00:00
|
|
|
* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA USA.
|
2009-06-27 03:32:33 +00:00
|
|
|
* http://www.gnu.org/copyleft/gpl.html
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "stdafx.h"
|
|
|
|
#include "GSRendererDX9.h"
|
|
|
|
#include "GSCrc.h"
|
|
|
|
#include "resource.h"
|
|
|
|
|
2009-09-18 19:54:56 +00:00
|
|
|
GSRendererDX9::GSRendererDX9()
|
2012-01-19 04:53:36 +00:00
|
|
|
: GSRendererDX(new GSTextureCache9(this))
|
2009-06-27 03:32:33 +00:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2009-09-17 07:40:38 +00:00
|
|
|
bool GSRendererDX9::CreateDevice(GSDevice* dev)
|
2009-06-27 03:32:33 +00:00
|
|
|
{
|
2009-09-17 07:40:38 +00:00
|
|
|
if(!__super::CreateDevice(dev))
|
2009-06-27 03:32:33 +00:00
|
|
|
return false;
|
|
|
|
|
|
|
|
//
|
|
|
|
|
|
|
|
memset(&m_fba.dss, 0, sizeof(m_fba.dss));
|
|
|
|
|
|
|
|
m_fba.dss.StencilEnable = true;
|
|
|
|
m_fba.dss.StencilReadMask = 2;
|
|
|
|
m_fba.dss.StencilWriteMask = 2;
|
|
|
|
m_fba.dss.StencilFunc = D3DCMP_EQUAL;
|
|
|
|
m_fba.dss.StencilPassOp = D3DSTENCILOP_ZERO;
|
|
|
|
m_fba.dss.StencilFailOp = D3DSTENCILOP_ZERO;
|
|
|
|
m_fba.dss.StencilDepthFailOp = D3DSTENCILOP_ZERO;
|
|
|
|
m_fba.dss.StencilRef = 2;
|
|
|
|
|
|
|
|
memset(&m_fba.bs, 0, sizeof(m_fba.bs));
|
|
|
|
|
|
|
|
m_fba.bs.RenderTargetWriteMask = D3DCOLORWRITEENABLE_ALPHA;
|
|
|
|
|
|
|
|
//
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
GSdx-D3D: Texture and channel shuffle improvements.
Texture Shuffle changes:
Always Enable Texture shuffle on D3D10/11.
Previously Texture shuffle was enabled if CRC hack
level was below Full, this was kinda not good since
D3D also relies on CRC hacks on Full so you could either
stick with texture shuffle or crc hacks.
Texture shuffle is not supported on D3D9, however we can do a partial
port where instead of vertical lines with the effect we get the effect
on the entire screen. Better than nothing I suppose.
Ported some of the code from OpenGL to D3D
( just a copy - paste job :) ),
part of the code misses a dedicated shader but we can still
use it to fix various issues on many games.
List of affected games tested so far:
The Godfather, Final Fight Streetwise, The Suffering Ties that Bind,
Urban Chaos have their vertical lines issues fixed
(highly possible for other games as well), MGS and Stolen see an improvement
but they are still broken without crc hacks. Other games that suffered
similar issues are probably affected as well.
Channel Shuffle changes:
Update Channel Shuffle detection. A lot of games should see an improvement,
MGS, Urban Chaos, Stolen have their top left corner issues resolved.
Other games should be affected as well that use similar logic.
They still miss a shader so some effects are still broken/show glitches
but it's a nice improvement for D3D users.
Shared changes:
Texture Shuffle and Channel shuffle have been moved to their
own dedicated functions. Should make things a bit cleaner.
Move part of the code for Texture Shuffle to GSRendererHW to be shared
across all HW renderers, should aboid copy paste/duplicate code.
2018-03-18 09:08:36 +00:00
|
|
|
void GSRendererDX9::EmulateTextureShuffleAndFbmask()
|
|
|
|
{
|
|
|
|
if (m_texture_shuffle) {
|
|
|
|
// We can do a partial port for D3D9 that skips the draw call to give it a slight improvement.
|
|
|
|
// It's still broken but more bearable. Broken effect is on the screen but fully instead of vertical lines.
|
|
|
|
throw GSDXRecoverableError();
|
|
|
|
} else {
|
|
|
|
om_bsel.wrgba = ~GSVector4i::load((int)m_context->FRAME.FBMSK).eq8(GSVector4i::xffffffff()).mask();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-03 21:18:49 +00:00
|
|
|
void GSRendererDX9::SetupIA(const float& sx, const float& sy)
|
2012-01-05 02:40:24 +00:00
|
|
|
{
|
2012-01-19 04:53:36 +00:00
|
|
|
D3DPRIMITIVETYPE topology;
|
|
|
|
|
|
|
|
switch(m_vt.m_primclass)
|
2011-02-07 01:59:05 +00:00
|
|
|
{
|
2012-01-05 02:40:24 +00:00
|
|
|
case GS_POINT_CLASS:
|
|
|
|
|
2012-01-19 04:53:36 +00:00
|
|
|
topology = D3DPT_POINTLIST;
|
2012-01-05 02:40:24 +00:00
|
|
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
case GS_LINE_CLASS:
|
2009-06-27 03:32:33 +00:00
|
|
|
|
2012-01-19 04:53:36 +00:00
|
|
|
topology = D3DPT_LINELIST;
|
2009-06-27 03:32:33 +00:00
|
|
|
|
2012-01-05 02:40:24 +00:00
|
|
|
if(PRIM->IIP == 0)
|
2011-02-07 01:59:05 +00:00
|
|
|
{
|
2012-01-05 02:40:24 +00:00
|
|
|
for(size_t i = 0, j = m_index.tail; i < j; i += 2)
|
|
|
|
{
|
|
|
|
uint32 tmp = m_index.buff[i + 0];
|
|
|
|
m_index.buff[i + 0] = m_index.buff[i + 1];
|
|
|
|
m_index.buff[i + 1] = tmp;
|
|
|
|
}
|
2011-02-07 01:59:05 +00:00
|
|
|
}
|
2009-06-27 03:32:33 +00:00
|
|
|
|
2012-01-05 02:40:24 +00:00
|
|
|
break;
|
|
|
|
|
|
|
|
case GS_TRIANGLE_CLASS:
|
|
|
|
|
2012-01-19 04:53:36 +00:00
|
|
|
topology = D3DPT_TRIANGLELIST;
|
2009-07-16 21:36:07 +00:00
|
|
|
|
2012-01-05 02:40:24 +00:00
|
|
|
if(PRIM->IIP == 0)
|
2011-02-07 01:59:05 +00:00
|
|
|
{
|
2012-01-05 02:40:24 +00:00
|
|
|
for(size_t i = 0, j = m_index.tail; i < j; i += 3)
|
|
|
|
{
|
|
|
|
uint32 tmp = m_index.buff[i + 0];
|
|
|
|
m_index.buff[i + 0] = m_index.buff[i + 2];
|
|
|
|
m_index.buff[i + 2] = tmp;
|
|
|
|
}
|
2011-02-07 01:59:05 +00:00
|
|
|
}
|
2009-06-27 03:32:33 +00:00
|
|
|
|
2012-01-05 02:40:24 +00:00
|
|
|
break;
|
|
|
|
|
|
|
|
case GS_SPRITE_CLASS:
|
|
|
|
|
2012-01-19 04:53:36 +00:00
|
|
|
topology = D3DPT_TRIANGLELIST;
|
2012-01-05 02:40:24 +00:00
|
|
|
|
|
|
|
// each sprite converted to quad needs twice the space
|
|
|
|
|
2017-03-03 21:18:49 +00:00
|
|
|
Lines2Sprites();
|
2009-06-27 03:32:33 +00:00
|
|
|
|
|
|
|
break;
|
2012-01-05 02:40:24 +00:00
|
|
|
|
2009-06-27 03:32:33 +00:00
|
|
|
default:
|
|
|
|
__assume(0);
|
|
|
|
}
|
|
|
|
|
2012-01-19 04:53:36 +00:00
|
|
|
GSDevice9* dev = (GSDevice9*)m_dev;
|
|
|
|
|
|
|
|
(*dev)->SetRenderState(D3DRS_SHADEMODE, PRIM->IIP ? D3DSHADE_GOURAUD : D3DSHADE_FLAT); // TODO
|
|
|
|
|
|
|
|
void* ptr = NULL;
|
|
|
|
|
|
|
|
if(dev->IAMapVertexBuffer(&ptr, sizeof(GSVertexHW9), m_vertex.next))
|
|
|
|
{
|
|
|
|
GSVertex* RESTRICT s = (GSVertex*)m_vertex.buff;
|
|
|
|
GSVertexHW9* RESTRICT d = (GSVertexHW9*)ptr;
|
|
|
|
|
2014-01-26 00:58:21 +00:00
|
|
|
for(uint32 i = 0; i < m_vertex.next; i++, s++, d++)
|
2012-01-19 04:53:36 +00:00
|
|
|
{
|
|
|
|
GSVector4 p = GSVector4(GSVector4i::load(s->XYZ.u32[0]).upl16());
|
|
|
|
|
|
|
|
if(PRIM->TME && !PRIM->FST)
|
|
|
|
{
|
|
|
|
p = p.xyxy(GSVector4((float)s->XYZ.Z, s->RGBAQ.Q));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
p = p.xyxy(GSVector4::load((float)s->XYZ.Z));
|
|
|
|
}
|
|
|
|
|
|
|
|
GSVector4 t = GSVector4::zero();
|
|
|
|
|
|
|
|
if(PRIM->TME)
|
|
|
|
{
|
|
|
|
if(PRIM->FST)
|
|
|
|
{
|
2013-02-12 10:57:48 +00:00
|
|
|
if(UserHacks_WildHack && !isPackedUV_HackFlag)
|
|
|
|
{
|
|
|
|
t = GSVector4(GSVector4i::load(s->UV & 0x3FEF3FEF).upl16());
|
|
|
|
//printf("GSDX: %08X | D3D9(%d) %s\n", s->UV & 0x3FEF3FEF, m_vertex.next, i == 0 ? "*" : "");
|
|
|
|
}
|
|
|
|
else
|
GSdx:
- changed the KH2 fix in GetTextureMinMax to my taste, should give the same results, when the used texture rect is to the left/above the clamped area, it returns [min, min+1], and [max-1, max] for right/below
- m_mem.m_clut.Read32 was returned to its original place from GetAlphaMinMax
- UserHacks_WildHack was moved up to GSState, special UV handlers are only used when this setting is active
- updated xbyak to the latest available (avx2 seems incomplete, the 256-bit promoted old instructions are missing)
- changed vtune's include path to the 2013 edition
Some other not yet commited changes from a year ago:
- WriteImageX overflow crash-fix
- moved colclamp after dithering (sw mode), it makes more sense, no visible changes noticed
- Gif_Tag::analyzeTag(), there was a conditional I didn't like, split the loop into two parts
git-svn-id: http://pcsx2.googlecode.com/svn/trunk@5649 96395faa-99c1-11dd-bbfe-3dabce05a288
2013-06-06 11:36:01 +00:00
|
|
|
{
|
2013-02-12 10:57:48 +00:00
|
|
|
t = GSVector4(GSVector4i::load(s->UV).upl16());
|
GSdx:
- changed the KH2 fix in GetTextureMinMax to my taste, should give the same results, when the used texture rect is to the left/above the clamped area, it returns [min, min+1], and [max-1, max] for right/below
- m_mem.m_clut.Read32 was returned to its original place from GetAlphaMinMax
- UserHacks_WildHack was moved up to GSState, special UV handlers are only used when this setting is active
- updated xbyak to the latest available (avx2 seems incomplete, the 256-bit promoted old instructions are missing)
- changed vtune's include path to the 2013 edition
Some other not yet commited changes from a year ago:
- WriteImageX overflow crash-fix
- moved colclamp after dithering (sw mode), it makes more sense, no visible changes noticed
- Gif_Tag::analyzeTag(), there was a conditional I didn't like, split the loop into two parts
git-svn-id: http://pcsx2.googlecode.com/svn/trunk@5649 96395faa-99c1-11dd-bbfe-3dabce05a288
2013-06-06 11:36:01 +00:00
|
|
|
}
|
2012-01-19 04:53:36 +00:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
t = GSVector4::loadl(&s->ST);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
t = t.xyxy(GSVector4::cast(GSVector4i(s->RGBAQ.u32[0], s->FOG)));
|
|
|
|
|
|
|
|
d->p = p;
|
|
|
|
d->t = t;
|
|
|
|
}
|
|
|
|
|
|
|
|
dev->IAUnmapVertexBuffer();
|
|
|
|
}
|
|
|
|
|
|
|
|
dev->IASetIndexBuffer(m_index.buff, m_index.tail);
|
|
|
|
|
|
|
|
dev->IASetPrimitiveTopology(topology);
|
2009-06-27 03:32:33 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void GSRendererDX9::UpdateFBA(GSTexture* rt)
|
|
|
|
{
|
2015-06-05 20:37:34 +00:00
|
|
|
if (!rt)
|
|
|
|
return;
|
|
|
|
|
2009-06-27 03:32:33 +00:00
|
|
|
GSDevice9* dev = (GSDevice9*)m_dev;
|
|
|
|
|
|
|
|
dev->BeginScene();
|
|
|
|
|
|
|
|
// om
|
|
|
|
|
|
|
|
dev->OMSetDepthStencilState(&m_fba.dss);
|
|
|
|
dev->OMSetBlendState(&m_fba.bs, 0);
|
|
|
|
|
|
|
|
// ia
|
|
|
|
|
2009-08-02 23:07:30 +00:00
|
|
|
GSVector4 s = GSVector4(rt->GetScale().x / rt->GetWidth(), rt->GetScale().y / rt->GetHeight());
|
2015-05-15 18:40:09 +00:00
|
|
|
GSVector4 off = GSVector4(-1.0f, 1.0f);
|
2009-06-27 03:32:33 +00:00
|
|
|
|
2015-05-15 18:40:09 +00:00
|
|
|
GSVector4 src = ((m_vt.m_min.p.xyxy(m_vt.m_max.p) + off.xxyy()) * s.xyxy()).sat(off.zzyy());
|
|
|
|
GSVector4 dst = src * 2.0f + off.xxxx();
|
2009-06-27 03:32:33 +00:00
|
|
|
|
|
|
|
GSVertexPT1 vertices[] =
|
|
|
|
{
|
2016-10-13 09:25:48 +00:00
|
|
|
{GSVector4(dst.x, -dst.y, 0.5f, 1.0f), GSVector2(0)},
|
|
|
|
{GSVector4(dst.z, -dst.y, 0.5f, 1.0f), GSVector2(0)},
|
|
|
|
{GSVector4(dst.x, -dst.w, 0.5f, 1.0f), GSVector2(0)},
|
|
|
|
{GSVector4(dst.z, -dst.w, 0.5f, 1.0f), GSVector2(0)},
|
2009-06-27 03:32:33 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
dev->IASetVertexBuffer(vertices, sizeof(vertices[0]), countof(vertices));
|
|
|
|
dev->IASetInputLayout(dev->m_convert.il);
|
|
|
|
dev->IASetPrimitiveTopology(D3DPT_TRIANGLESTRIP);
|
|
|
|
|
|
|
|
// vs
|
|
|
|
|
|
|
|
dev->VSSetShader(dev->m_convert.vs, NULL, 0);
|
|
|
|
|
|
|
|
// ps
|
|
|
|
|
|
|
|
dev->PSSetShader(dev->m_convert.ps[4], NULL, 0);
|
|
|
|
|
|
|
|
//
|
|
|
|
|
|
|
|
dev->DrawPrimitive();
|
|
|
|
|
|
|
|
//
|
|
|
|
|
|
|
|
dev->EndScene();
|
|
|
|
}
|