Fixed 24 bit depth copies to RAM. 24 and 16 bit depth copies are now more accurate. Added an offset to DX copies to RAM and made half sized copies to a texture linearly filtered.
git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@4635 8ced0084-cf51-0410-be5f-012b33b47a6e
This commit is contained in:
parent
6e56ea80f7
commit
e6d51e8ff4
|
@ -612,18 +612,31 @@ void WriteZ16Encoder(char* p,bool HLSL)
|
||||||
WriteSwizzler(p, GX_TF_Z16,HLSL);
|
WriteSwizzler(p, GX_TF_Z16,HLSL);
|
||||||
|
|
||||||
WRITE(p, " float depth;\n");
|
WRITE(p, " float depth;\n");
|
||||||
|
WRITE(p, " float3 expanded;\n");
|
||||||
|
|
||||||
// byte order is reversed
|
// byte order is reversed
|
||||||
|
|
||||||
WriteSampleColor(p, "b", "depth",HLSL);
|
WriteSampleColor(p, "b", "depth",HLSL);
|
||||||
WRITE(p, " ocol0.b = frac(depth * 256.0f);\n");
|
|
||||||
WRITE(p, " ocol0.g = depth;\n");
|
WRITE(p, " depth *= 16777215.0f;\n");
|
||||||
|
WRITE(p, " expanded.r = floor(depth / (256 * 256));\n");
|
||||||
|
WRITE(p, " depth -= expanded.r * 256 * 256;\n");
|
||||||
|
WRITE(p, " expanded.g = floor(depth / 256);\n");
|
||||||
|
|
||||||
|
WRITE(p, " ocol0.b = expanded.g / 255;\n");
|
||||||
|
WRITE(p, " ocol0.g = expanded.r / 255;\n");
|
||||||
|
|
||||||
WriteIncrementSampleX(p,HLSL);
|
WriteIncrementSampleX(p,HLSL);
|
||||||
|
|
||||||
WriteSampleColor(p, "b", "depth",HLSL);
|
WriteSampleColor(p, "b", "depth",HLSL);
|
||||||
WRITE(p, " ocol0.r = frac(depth * 256.0f);\n");
|
|
||||||
WRITE(p, " ocol0.a = depth;\n");
|
WRITE(p, " depth *= 16777215.0f;\n");
|
||||||
|
WRITE(p, " expanded.r = floor(depth / (256 * 256));\n");
|
||||||
|
WRITE(p, " depth -= expanded.r * 256 * 256;\n");
|
||||||
|
WRITE(p, " expanded.g = floor(depth / 256);\n");
|
||||||
|
|
||||||
|
WRITE(p, " ocol0.r = expanded.g / 255;\n");
|
||||||
|
WRITE(p, " ocol0.a = expanded.r / 255;\n");
|
||||||
|
|
||||||
WriteEncoderEnd(p);
|
WriteEncoderEnd(p);
|
||||||
}
|
}
|
||||||
|
@ -633,18 +646,35 @@ void WriteZ16LEncoder(char* p,bool HLSL)
|
||||||
WriteSwizzler(p, GX_CTF_Z16L,HLSL);
|
WriteSwizzler(p, GX_CTF_Z16L,HLSL);
|
||||||
|
|
||||||
WRITE(p, " float depth;\n");
|
WRITE(p, " float depth;\n");
|
||||||
|
WRITE(p, " float3 expanded;\n");
|
||||||
|
|
||||||
// byte order is reversed
|
// byte order is reversed
|
||||||
|
|
||||||
WriteSampleColor(p, "b", "depth",HLSL);
|
WriteSampleColor(p, "b", "depth",HLSL);
|
||||||
WRITE(p, " ocol0.b = frac(depth * 65536.0f);\n");
|
|
||||||
WRITE(p, " ocol0.g = frac(depth * 256.0f);\n");
|
WRITE(p, " depth *= 16777215.0f;\n");
|
||||||
|
WRITE(p, " expanded.r = floor(depth / (256 * 256));\n");
|
||||||
|
WRITE(p, " depth -= expanded.r * 256 * 256;\n");
|
||||||
|
WRITE(p, " expanded.g = floor(depth / 256);\n");
|
||||||
|
WRITE(p, " depth -= expanded.g * 256;\n");
|
||||||
|
WRITE(p, " expanded.b = depth;\n");
|
||||||
|
|
||||||
|
WRITE(p, " ocol0.b = expanded.b / 255;\n");
|
||||||
|
WRITE(p, " ocol0.g = expanded.g / 255;\n");
|
||||||
|
|
||||||
WriteIncrementSampleX(p,HLSL);
|
WriteIncrementSampleX(p,HLSL);
|
||||||
|
|
||||||
WriteSampleColor(p, "b", "depth",HLSL);
|
WriteSampleColor(p, "b", "depth",HLSL);
|
||||||
WRITE(p, " ocol0.r = frac(depth * 65536.0f);\n");
|
|
||||||
WRITE(p, " ocol0.a = frac(depth * 256.0f);\n");
|
WRITE(p, " depth *= 16777215.0f;\n");
|
||||||
|
WRITE(p, " expanded.r = floor(depth / (256 * 256));\n");
|
||||||
|
WRITE(p, " depth -= expanded.r * 256 * 256;\n");
|
||||||
|
WRITE(p, " expanded.g = floor(depth / 256);\n");
|
||||||
|
WRITE(p, " depth -= expanded.g * 256;\n");
|
||||||
|
WRITE(p, " expanded.b = depth;\n");
|
||||||
|
|
||||||
|
WRITE(p, " ocol0.r = expanded.b;\n");
|
||||||
|
WRITE(p, " ocol0.a = expanded.g;\n");
|
||||||
|
|
||||||
WriteEncoderEnd(p);
|
WriteEncoderEnd(p);
|
||||||
}
|
}
|
||||||
|
@ -657,24 +687,38 @@ void WriteZ24Encoder(char* p, bool HLSL)
|
||||||
|
|
||||||
WRITE(p, " float depth0;\n");
|
WRITE(p, " float depth0;\n");
|
||||||
WRITE(p, " float depth1;\n");
|
WRITE(p, " float depth1;\n");
|
||||||
|
WRITE(p, " float3 expanded0;\n");
|
||||||
|
WRITE(p, " float3 expanded1;\n");
|
||||||
|
|
||||||
WriteSampleColor(p, "b", "depth0",HLSL);
|
WriteSampleColor(p, "b", "depth0",HLSL);
|
||||||
WriteIncrementSampleX(p,HLSL);
|
WriteIncrementSampleX(p,HLSL);
|
||||||
WriteSampleColor(p, "b", "depth1",HLSL);
|
WriteSampleColor(p, "b", "depth1",HLSL);
|
||||||
|
|
||||||
|
for (int i = 0; i < 2; i++)
|
||||||
|
{
|
||||||
|
WRITE(p, " depth%i *= 16777215.0f;\n", i);
|
||||||
|
|
||||||
|
WRITE(p, " expanded%i.r = floor(depth%i / (256 * 256));\n", i, i);
|
||||||
|
WRITE(p, " depth%i -= expanded%i.r * 256 * 256;\n", i, i);
|
||||||
|
WRITE(p, " expanded%i.g = floor(depth%i / 256);\n", i, i);
|
||||||
|
WRITE(p, " depth%i -= expanded%i.g * 256;\n", i, i);
|
||||||
|
WRITE(p, " expanded%i.b = depth%i;\n", i, i);
|
||||||
|
}
|
||||||
|
|
||||||
WRITE(p, " if(cl > 0.5f) {\n");
|
WRITE(p, " if(cl > 0.5f) {\n");
|
||||||
// upper 16
|
// upper 16
|
||||||
WRITE(p, " ocol0.b = frac(depth0 * 256.0f);\n");
|
WRITE(p, " ocol0.b = expanded0.g / 255;\n");
|
||||||
WRITE(p, " ocol0.g = depth0;\n");
|
WRITE(p, " ocol0.g = expanded0.b / 255;\n");
|
||||||
WRITE(p, " ocol0.r = frac(depth1 * 256.0f);\n");
|
WRITE(p, " ocol0.r = expanded1.g / 255;\n");
|
||||||
WRITE(p, " ocol0.a = depth1;\n");
|
WRITE(p, " ocol0.a = expanded1.b / 255;\n");
|
||||||
WRITE(p, " } else {\n");
|
WRITE(p, " } else {\n");
|
||||||
// lower 8
|
// lower 8
|
||||||
WRITE(p, " ocol0.b = 1.0f;\n");
|
WRITE(p, " ocol0.b = 1.0f;\n");
|
||||||
WRITE(p, " ocol0.g = frac(depth0 * 65536.0f);\n");
|
WRITE(p, " ocol0.g = expanded0.r / 255;\n");
|
||||||
WRITE(p, " ocol0.r = 1.0f;\n");
|
WRITE(p, " ocol0.r = 1.0f;\n");
|
||||||
WRITE(p, " ocol0.a = frac(depth0 * 65536.0f);\n");
|
WRITE(p, " ocol0.a = expanded1.r / 255;\n");
|
||||||
WRITE(p, " }\n");
|
WRITE(p, " }\n");
|
||||||
|
|
||||||
WriteEncoderEnd(p);
|
WriteEncoderEnd(p);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -180,7 +180,7 @@ int TexDecoder_GetBlockHeightInTexels(u32 format)
|
||||||
case GX_CTF_GB8: return 4;
|
case GX_CTF_GB8: return 4;
|
||||||
case GX_TF_Z8: return 4;
|
case GX_TF_Z8: return 4;
|
||||||
case GX_TF_Z16: return 4;
|
case GX_TF_Z16: return 4;
|
||||||
case GX_TF_Z24X8: return 1;
|
case GX_TF_Z24X8: return 4;
|
||||||
case GX_CTF_Z4: return 8;
|
case GX_CTF_Z4: return 8;
|
||||||
case GX_CTF_Z8M: return 4;
|
case GX_CTF_Z8M: return 4;
|
||||||
case GX_CTF_Z8L: return 4;
|
case GX_CTF_Z8L: return 4;
|
||||||
|
|
|
@ -474,20 +474,16 @@ have_texture:
|
||||||
sourcerect.left = targetSource.left;
|
sourcerect.left = targetSource.left;
|
||||||
sourcerect.right = targetSource.right;
|
sourcerect.right = targetSource.right;
|
||||||
sourcerect.top = targetSource.top;
|
sourcerect.top = targetSource.top;
|
||||||
if(bFromZBuffer)
|
|
||||||
{
|
if(bScaleByHalf)
|
||||||
|
D3D::dev->SetSamplerState(0, D3DSAMP_MINFILTER, D3DTEXF_LINEAR);
|
||||||
|
else
|
||||||
D3D::dev->SetSamplerState(0, D3DSAMP_MINFILTER, D3DTEXF_POINT);
|
D3D::dev->SetSamplerState(0, D3DSAMP_MINFILTER, D3DTEXF_POINT);
|
||||||
D3D::dev->SetSamplerState(0, D3DSAMP_MAGFILTER, D3DTEXF_POINT);
|
|
||||||
D3D::dev->SetSamplerState(0, D3DSAMP_MIPFILTER, D3DTEXF_POINT);
|
|
||||||
}
|
|
||||||
D3DFORMAT bformat = FBManager::GetEFBDepthRTSurfaceFormat();
|
D3DFORMAT bformat = FBManager::GetEFBDepthRTSurfaceFormat();
|
||||||
D3D::drawShadedTexQuad(read_texture,&sourcerect, Renderer::GetTargetWidth() , Renderer::GetTargetHeight(),&destrect,((bformat != FOURCC_RAWZ && bformat != D3DFMT_D24X8) && bFromZBuffer)? PixelShaderCache::GetDepthMatrixProgram(): PixelShaderCache::GetColorMatrixProgram(),VertexShaderCache::GetSimpleVertexShader());
|
D3D::drawShadedTexQuad(read_texture,&sourcerect, Renderer::GetTargetWidth() , Renderer::GetTargetHeight(),&destrect,((bformat != FOURCC_RAWZ && bformat != D3DFMT_D24X8) && bFromZBuffer)? PixelShaderCache::GetDepthMatrixProgram(): PixelShaderCache::GetColorMatrixProgram(),VertexShaderCache::GetSimpleVertexShader());
|
||||||
if(bFromZBuffer)
|
|
||||||
{
|
|
||||||
D3D::RefreshSamplerState(0, D3DSAMP_MINFILTER);
|
D3D::RefreshSamplerState(0, D3DSAMP_MINFILTER);
|
||||||
D3D::RefreshSamplerState(0, D3DSAMP_MAGFILTER);
|
|
||||||
D3D::RefreshSamplerState(0, D3DSAMP_MIPFILTER);
|
|
||||||
}
|
|
||||||
|
|
||||||
D3D::dev->SetRenderTarget(0, FBManager::GetEFBColorRTSurface());
|
D3D::dev->SetRenderTarget(0, FBManager::GetEFBColorRTSurface());
|
||||||
D3D::dev->SetDepthStencilSurface(FBManager::GetEFBDepthRTSurface());
|
D3D::dev->SetDepthStencilSurface(FBManager::GetEFBDepthRTSurface());
|
||||||
|
|
|
@ -176,7 +176,7 @@ void Shutdown()
|
||||||
s_texConvFrameBuffer = NULL;*/
|
s_texConvFrameBuffer = NULL;*/
|
||||||
}
|
}
|
||||||
|
|
||||||
void EncodeToRamUsingShader(LPDIRECT3DPIXELSHADER9 shader, LPDIRECT3DTEXTURE9 srcTexture,int srcTextureWidth,int srcTextureHeight, const TargetRectangle& sourceRc,
|
void EncodeToRamUsingShader(LPDIRECT3DPIXELSHADER9 shader, LPDIRECT3DTEXTURE9 srcTexture, const TargetRectangle& sourceRc,
|
||||||
u8* destAddr, int dstWidth, int dstHeight, int readStride, bool toTexture, bool linearFilter)
|
u8* destAddr, int dstWidth, int dstHeight, int readStride, bool toTexture, bool linearFilter)
|
||||||
{
|
{
|
||||||
HRESULT hr;
|
HRESULT hr;
|
||||||
|
@ -227,7 +227,7 @@ void EncodeToRamUsingShader(LPDIRECT3DPIXELSHADER9 shader, LPDIRECT3DTEXTURE9 sr
|
||||||
|
|
||||||
|
|
||||||
// Draw...
|
// Draw...
|
||||||
D3D::drawShadedTexQuad(srcTexture,&SrcRect,srcTextureWidth,srcTextureHeight,&DstRect,shader,VertexShaderCache::GetSimpleVertexShader());
|
D3D::drawShadedTexQuad(srcTexture,&SrcRect,1,1,&DstRect,shader,VertexShaderCache::GetSimpleVertexShader());
|
||||||
hr = D3D::dev->SetRenderTarget(0, FBManager::GetEFBColorRTSurface());
|
hr = D3D::dev->SetRenderTarget(0, FBManager::GetEFBColorRTSurface());
|
||||||
hr = D3D::dev->SetDepthStencilSurface(FBManager::GetEFBDepthRTSurface());
|
hr = D3D::dev->SetDepthStencilSurface(FBManager::GetEFBDepthRTSurface());
|
||||||
Renderer::RestoreAPIState();
|
Renderer::RestoreAPIState();
|
||||||
|
@ -258,20 +258,20 @@ void EncodeToRamUsingShader(LPDIRECT3DPIXELSHADER9 shader, LPDIRECT3DTEXTURE9 sr
|
||||||
// writing to a texture of a different size
|
// writing to a texture of a different size
|
||||||
|
|
||||||
int readHeight = readStride / dstWidth;
|
int readHeight = readStride / dstWidth;
|
||||||
//readHeight /= 4; // 4 bytes per pixel
|
|
||||||
|
|
||||||
int readStart = 0;
|
int readStart = 0;
|
||||||
int readLoops = dstHeight / (readHeight/4);
|
int readLoops = dstHeight / (readHeight/4); // 4 bytes per pixel
|
||||||
u8 *Source = (u8*)drect.pBits;
|
u8 *Source = (u8*)drect.pBits;
|
||||||
for (int i = 0; i < readLoops; i++)
|
for (int i = 0; i < readLoops; i++)
|
||||||
{
|
{
|
||||||
memcpy(destAddr,Source,dstWidth*readHeight);
|
int readDist = dstWidth*readHeight;
|
||||||
Source += readHeight;
|
memcpy(destAddr,Source,readDist);
|
||||||
|
Source += readDist;
|
||||||
destAddr += writeStride;
|
destAddr += writeStride;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
memcpy(destAddr,drect.pBits,dstWidth*dstHeight*4);
|
memcpy(destAddr,drect.pBits,dstWidth*dstHeight*4);// 4 bytes per pixel
|
||||||
|
|
||||||
hr = s_tempConvReadSurface->UnlockRect();
|
hr = s_tempConvReadSurface->UnlockRect();
|
||||||
}
|
}
|
||||||
|
@ -330,8 +330,8 @@ void EncodeToRam(u32 address, bool bFromZBuffer, bool bIsIntensityFmt, u32 copyf
|
||||||
TextureConversionShader::SetShaderParameters(
|
TextureConversionShader::SetShaderParameters(
|
||||||
(float)expandedWidth,
|
(float)expandedWidth,
|
||||||
expandedHeight * MValueY,
|
expandedHeight * MValueY,
|
||||||
source.left * MValueX,
|
source.left * MValueX + 0.5f,
|
||||||
top,
|
top + 0.5f,
|
||||||
sampleStride * MValueX,
|
sampleStride * MValueX,
|
||||||
sampleStride * MValueY,
|
sampleStride * MValueY,
|
||||||
(float)Renderer::GetTargetWidth(),
|
(float)Renderer::GetTargetWidth(),
|
||||||
|
@ -347,7 +347,7 @@ void EncodeToRam(u32 address, bool bFromZBuffer, bool bIsIntensityFmt, u32 copyf
|
||||||
cacheBytes = 64;
|
cacheBytes = 64;
|
||||||
|
|
||||||
int readStride = (expandedWidth * cacheBytes) / TexDecoder_GetBlockWidthInTexels(format);
|
int readStride = (expandedWidth * cacheBytes) / TexDecoder_GetBlockWidthInTexels(format);
|
||||||
EncodeToRamUsingShader(texconv_shader, source_texture,1,1, scaledSource, dest_ptr, expandedWidth / samples, expandedHeight,readStride, true, bScaleByHalf > 0);
|
EncodeToRamUsingShader(texconv_shader, source_texture, scaledSource, dest_ptr, expandedWidth / samples, expandedHeight,readStride, true, bScaleByHalf > 0);
|
||||||
}
|
}
|
||||||
|
|
||||||
/*void EncodeToRamYUYV(GLuint srcTexture, const TargetRectangle& sourceRc,
|
/*void EncodeToRamYUYV(GLuint srcTexture, const TargetRectangle& sourceRc,
|
||||||
|
|
|
@ -68,7 +68,7 @@ void SaveTexture(const char* filename, u32 texmap)
|
||||||
|
|
||||||
TexImage0& ti0 = texUnit.texImage0[subTexmap];
|
TexImage0& ti0 = texUnit.texImage0[subTexmap];
|
||||||
|
|
||||||
SaveTexture(filename, texmap, ti0.width, ti0.height);
|
SaveTexture(filename, texmap, ti0.width + 1, ti0.height + 1);
|
||||||
}
|
}
|
||||||
|
|
||||||
void GetTextureBGRA(u8 *dst, u32 texmap, int width, int height)
|
void GetTextureBGRA(u8 *dst, u32 texmap, int width, int height)
|
||||||
|
|
|
@ -584,6 +584,14 @@ void Tev::Draw()
|
||||||
float scaleT = bpmem.texscale[stageNum2].getScaleT(stageOdd);
|
float scaleT = bpmem.texscale[stageNum2].getScaleT(stageOdd);
|
||||||
|
|
||||||
TextureSampler::Sample(Uv[texcoordSel][0] * scaleS, Uv[texcoordSel][1] * scaleT, Lod[texcoordSel], texmap, IndirectTex[stageNum]);
|
TextureSampler::Sample(Uv[texcoordSel][0] * scaleS, Uv[texcoordSel][1] * scaleT, Lod[texcoordSel], texmap, IndirectTex[stageNum]);
|
||||||
|
|
||||||
|
#ifdef _DEBUG
|
||||||
|
if (g_Config.bDumpTevStages)
|
||||||
|
{
|
||||||
|
u8 stage[4] = {(u8)IndirectTex[stageNum][3], (u8)IndirectTex[stageNum][2], (u8)IndirectTex[stageNum][1], 255};
|
||||||
|
DebugUtil::DrawObjectBuffer(Position[0], Position[1], stage, 16+stageNum, "Ind");
|
||||||
|
}
|
||||||
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
for (unsigned int stageNum = 0; stageNum <= bpmem.genMode.numtevstages; stageNum++)
|
for (unsigned int stageNum = 0; stageNum <= bpmem.genMode.numtevstages; stageNum++)
|
||||||
|
|
Loading…
Reference in New Issue