GPU/SW: Use new 5-to-8 converters for RGBA8 display
This commit is contained in:
parent
6c05413220
commit
b13c51a2e2
|
@ -1245,7 +1245,7 @@ void GPU::ReadVRAM(u32 x, u32 y, u32 width, u32 height) {}
|
||||||
|
|
||||||
void GPU::FillVRAM(u32 x, u32 y, u32 width, u32 height, u32 color)
|
void GPU::FillVRAM(u32 x, u32 y, u32 width, u32 height, u32 color)
|
||||||
{
|
{
|
||||||
const u16 color16 = RGBA8888ToRGBA5551(color);
|
const u16 color16 = VRAMRGBA8888ToRGBA5551(color);
|
||||||
if ((x + width) <= VRAM_WIDTH && !IsInterlacedRenderingEnabled())
|
if ((x + width) <= VRAM_WIDTH && !IsInterlacedRenderingEnabled())
|
||||||
{
|
{
|
||||||
for (u32 yoffs = 0; yoffs < height; yoffs++)
|
for (u32 yoffs = 0; yoffs < height; yoffs++)
|
||||||
|
@ -1507,7 +1507,7 @@ bool GPU::DumpVRAMToFile(const char* filename, u32 width, u32 height, u32 stride
|
||||||
u16 src_col;
|
u16 src_col;
|
||||||
std::memcpy(&src_col, row_ptr_in, sizeof(u16));
|
std::memcpy(&src_col, row_ptr_in, sizeof(u16));
|
||||||
row_ptr_in += sizeof(u16);
|
row_ptr_in += sizeof(u16);
|
||||||
*(ptr_out++) = RGBA5551ToRGBA8888(remove_alpha ? (src_col | u16(0x8000)) : src_col);
|
*(ptr_out++) = VRAMRGBA5551ToRGBA8888(remove_alpha ? (src_col | u16(0x8000)) : src_col);
|
||||||
}
|
}
|
||||||
|
|
||||||
ptr_in += stride;
|
ptr_in += stride;
|
||||||
|
|
|
@ -175,27 +175,6 @@ protected:
|
||||||
}
|
}
|
||||||
ALWAYS_INLINE static constexpr TickCount SystemTicksToGPUTicks(TickCount sysclk_ticks) { return sysclk_ticks << 1; }
|
ALWAYS_INLINE static constexpr TickCount SystemTicksToGPUTicks(TickCount sysclk_ticks) { return sysclk_ticks << 1; }
|
||||||
|
|
||||||
// Helper/format conversion functions - constants from https://stackoverflow.com/a/9069480
|
|
||||||
ALWAYS_INLINE static constexpr u32 Convert5To8(u32 color) { return (((color * 527u) + 23u) >> 6); }
|
|
||||||
ALWAYS_INLINE static constexpr u32 Convert8To5(u32 color) { return (((color * 249u) + 1014u) >> 11); }
|
|
||||||
static constexpr u32 RGBA5551ToRGBA8888(u32 color)
|
|
||||||
{
|
|
||||||
const u32 r = Convert5To8(color & 31u);
|
|
||||||
const u32 g = Convert5To8((color >> 5) & 31u);
|
|
||||||
const u32 b = Convert5To8((color >> 10) & 31u);
|
|
||||||
const u32 a = ((color >> 15) != 0) ? 255 : 0;
|
|
||||||
return ZeroExtend32(r) | (ZeroExtend32(g) << 8) | (ZeroExtend32(b) << 16) | (ZeroExtend32(a) << 24);
|
|
||||||
}
|
|
||||||
|
|
||||||
static constexpr u16 RGBA8888ToRGBA5551(u32 color)
|
|
||||||
{
|
|
||||||
const u32 r = Convert8To5(color & 0xFFu);
|
|
||||||
const u32 g = Convert8To5((color >> 8) & 0xFFu);
|
|
||||||
const u32 b = Convert8To5((color >> 16) & 0xFFu);
|
|
||||||
const u32 a = ((color >> 24) & 0x01u);
|
|
||||||
return Truncate16(r | (g << 5) | (b << 10) | (a << 15));
|
|
||||||
}
|
|
||||||
|
|
||||||
static constexpr std::tuple<u8, u8> UnpackTexcoord(u16 texcoord)
|
static constexpr std::tuple<u8, u8> UnpackTexcoord(u16 texcoord)
|
||||||
{
|
{
|
||||||
return std::make_tuple(static_cast<u8>(texcoord), static_cast<u8>(texcoord >> 8));
|
return std::make_tuple(static_cast<u8>(texcoord), static_cast<u8>(texcoord >> 8));
|
||||||
|
|
|
@ -885,7 +885,7 @@ GPU_HW::VRAMFillUBOData GPU_HW::GetVRAMFillUBOData(u32 x, u32 y, u32 width, u32
|
||||||
{
|
{
|
||||||
// drop precision unless true colour is enabled
|
// drop precision unless true colour is enabled
|
||||||
if (!m_true_color)
|
if (!m_true_color)
|
||||||
color = RGBA5551ToRGBA8888(RGBA8888ToRGBA5551(color));
|
color = VRAMRGBA5551ToRGBA8888(VRAMRGBA8888ToRGBA5551(color));
|
||||||
|
|
||||||
VRAMFillUBOData uniforms;
|
VRAMFillUBOData uniforms;
|
||||||
std::tie(uniforms.u_fill_color[0], uniforms.u_fill_color[1], uniforms.u_fill_color[2], uniforms.u_fill_color[3]) =
|
std::tie(uniforms.u_fill_color[0], uniforms.u_fill_color[1], uniforms.u_fill_color[2], uniforms.u_fill_color[3]) =
|
||||||
|
|
|
@ -1031,7 +1031,8 @@ void GPU_HW_OpenGL::FillVRAM(u32 x, u32 y, u32 width, u32 height, u32 color)
|
||||||
// fast path when not using interlaced rendering
|
// fast path when not using interlaced rendering
|
||||||
if (!IsInterlacedRenderingEnabled())
|
if (!IsInterlacedRenderingEnabled())
|
||||||
{
|
{
|
||||||
const auto [r, g, b, a] = RGBA8ToFloat(m_true_color ? color : RGBA5551ToRGBA8888(RGBA8888ToRGBA5551(color)));
|
const auto [r, g, b, a] =
|
||||||
|
RGBA8ToFloat(m_true_color ? color : VRAMRGBA5551ToRGBA8888(VRAMRGBA8888ToRGBA5551(color)));
|
||||||
glClearColor(r, g, b, a);
|
glClearColor(r, g, b, a);
|
||||||
IsGLES() ? glClearDepthf(a) : glClearDepth(a);
|
IsGLES() ? glClearDepthf(a) : glClearDepth(a);
|
||||||
glClear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT);
|
glClear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT);
|
||||||
|
@ -1128,7 +1129,7 @@ void GPU_HW_OpenGL::UpdateVRAM(u32 x, u32 y, u32 width, u32 height, const void*
|
||||||
u16 src_col;
|
u16 src_col;
|
||||||
std::memcpy(&src_col, source_row_ptr, sizeof(src_col));
|
std::memcpy(&src_col, source_row_ptr, sizeof(src_col));
|
||||||
source_row_ptr += sizeof(src_col);
|
source_row_ptr += sizeof(src_col);
|
||||||
*(dest_ptr++) = RGBA5551ToRGBA8888(src_col | mask_or);
|
*(dest_ptr++) = VRAMRGBA5551ToRGBA8888(src_col | mask_or);
|
||||||
}
|
}
|
||||||
|
|
||||||
source_ptr -= source_stride;
|
source_ptr -= source_stride;
|
||||||
|
|
|
@ -115,30 +115,16 @@ ALWAYS_INLINE u16 VRAM16ToOutput<HostDisplayPixelFormat::RGB565, u16>(u16 value)
|
||||||
template<>
|
template<>
|
||||||
ALWAYS_INLINE u32 VRAM16ToOutput<HostDisplayPixelFormat::RGBA8, u32>(u16 value)
|
ALWAYS_INLINE u32 VRAM16ToOutput<HostDisplayPixelFormat::RGBA8, u32>(u16 value)
|
||||||
{
|
{
|
||||||
u8 r = Truncate8(value & 31);
|
return VRAMRGBA5551ToRGBA8888(value);
|
||||||
u8 g = Truncate8((value >> 5) & 31);
|
|
||||||
u8 b = Truncate8((value >> 10) & 31);
|
|
||||||
|
|
||||||
// 00012345 -> 1234545
|
|
||||||
b = (b << 3) | (b & 0b111);
|
|
||||||
g = (g << 3) | (g & 0b111);
|
|
||||||
r = (r << 3) | (r & 0b111);
|
|
||||||
|
|
||||||
return ZeroExtend32(r) | (ZeroExtend32(g) << 8) | (ZeroExtend32(b) << 16) | (0xFF000000u);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
template<>
|
template<>
|
||||||
ALWAYS_INLINE u32 VRAM16ToOutput<HostDisplayPixelFormat::BGRA8, u32>(u16 value)
|
ALWAYS_INLINE u32 VRAM16ToOutput<HostDisplayPixelFormat::BGRA8, u32>(u16 value)
|
||||||
{
|
{
|
||||||
u8 r = Truncate8(value & 31);
|
const u32 value32 = ZeroExtend32(value);
|
||||||
u8 g = Truncate8((value >> 5) & 31);
|
const u32 r = VRAMConvert5To8(value32 & 31u);
|
||||||
u8 b = Truncate8((value >> 10) & 31);
|
const u32 g = VRAMConvert5To8((value32 >> 5) & 31u);
|
||||||
|
const u32 b = VRAMConvert5To8((value32 >> 10) & 31u);
|
||||||
// 00012345 -> 1234545
|
|
||||||
b = (b << 3) | (b & 0b111);
|
|
||||||
g = (g << 3) | (g & 0b111);
|
|
||||||
r = (r << 3) | (r & 0b111);
|
|
||||||
|
|
||||||
return ZeroExtend32(b) | (ZeroExtend32(g) << 8) | (ZeroExtend32(r) << 16) | (0xFF000000u);
|
return ZeroExtend32(b) | (ZeroExtend32(g) << 8) | (ZeroExtend32(r) << 16) | (0xFF000000u);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -769,7 +769,7 @@ GPU_SW_Backend::GetDrawRectangleFunction(bool texture_enable, bool raw_texture_e
|
||||||
|
|
||||||
void GPU_SW_Backend::FillVRAM(u32 x, u32 y, u32 width, u32 height, u32 color, GPUBackendCommandParameters params)
|
void GPU_SW_Backend::FillVRAM(u32 x, u32 y, u32 width, u32 height, u32 color, GPUBackendCommandParameters params)
|
||||||
{
|
{
|
||||||
const u16 color16 = RGBA8888ToRGBA5551(color);
|
const u16 color16 = VRAMRGBA8888ToRGBA5551(color);
|
||||||
if ((x + width) <= VRAM_WIDTH && !params.interlaced_rendering)
|
if ((x + width) <= VRAM_WIDTH && !params.interlaced_rendering)
|
||||||
{
|
{
|
||||||
for (u32 yoffs = 0; yoffs < height; yoffs++)
|
for (u32 yoffs = 0; yoffs < height; yoffs++)
|
||||||
|
|
|
@ -114,31 +114,31 @@ union GPURenderCommand
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
// Helper/format conversion functions.
|
// Helper/format conversion functions - constants from https://stackoverflow.com/a/9069480
|
||||||
static constexpr u32 RGBA5551ToRGBA8888(u16 color)
|
ALWAYS_INLINE static constexpr u32 VRAMConvert5To8(u32 color)
|
||||||
{
|
{
|
||||||
u8 r = Truncate8(color & 31);
|
return (((color * 527u) + 23u) >> 6);
|
||||||
u8 g = Truncate8((color >> 5) & 31);
|
}
|
||||||
u8 b = Truncate8((color >> 10) & 31);
|
ALWAYS_INLINE static constexpr u32 VRAMConvert8To5(u32 color)
|
||||||
u8 a = Truncate8((color >> 15) & 1);
|
{
|
||||||
|
return (((color * 249u) + 1014u) >> 11);
|
||||||
// 00012345 -> 1234545
|
}
|
||||||
b = (b << 3) | (b & 0b111);
|
ALWAYS_INLINE static constexpr u32 VRAMRGBA5551ToRGBA8888(u32 color)
|
||||||
g = (g << 3) | (g & 0b111);
|
{
|
||||||
r = (r << 3) | (r & 0b111);
|
const u32 r = VRAMConvert5To8(color & 31u);
|
||||||
a = a ? 255 : 0;
|
const u32 g = VRAMConvert5To8((color >> 5) & 31u);
|
||||||
|
const u32 b = VRAMConvert5To8((color >> 10) & 31u);
|
||||||
|
const u32 a = ((color >> 15) != 0) ? 255 : 0;
|
||||||
return ZeroExtend32(r) | (ZeroExtend32(g) << 8) | (ZeroExtend32(b) << 16) | (ZeroExtend32(a) << 24);
|
return ZeroExtend32(r) | (ZeroExtend32(g) << 8) | (ZeroExtend32(b) << 16) | (ZeroExtend32(a) << 24);
|
||||||
}
|
}
|
||||||
|
|
||||||
static constexpr u16 RGBA8888ToRGBA5551(u32 color)
|
ALWAYS_INLINE static constexpr u16 VRAMRGBA8888ToRGBA5551(u32 color)
|
||||||
{
|
{
|
||||||
const u16 r = Truncate16((color >> 3) & 0x1Fu);
|
const u32 r = VRAMConvert8To5(color & 0xFFu);
|
||||||
const u16 g = Truncate16((color >> 11) & 0x1Fu);
|
const u32 g = VRAMConvert8To5((color >> 8) & 0xFFu);
|
||||||
const u16 b = Truncate16((color >> 19) & 0x1Fu);
|
const u32 b = VRAMConvert8To5((color >> 16) & 0xFFu);
|
||||||
const u16 a = Truncate16((color >> 31) & 0x01u);
|
const u32 a = ((color >> 24) & 0x01u);
|
||||||
|
return Truncate16(r | (g << 5) | (b << 10) | (a << 15));
|
||||||
return r | (g << 5) | (b << 10) | (a << 15);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
union GPUVertexPosition
|
union GPUVertexPosition
|
||||||
|
|
|
@ -15,7 +15,7 @@ Log_SetChannel(TextureReplacements);
|
||||||
|
|
||||||
TextureReplacements g_texture_replacements;
|
TextureReplacements g_texture_replacements;
|
||||||
|
|
||||||
static constexpr u32 RGBA5551ToRGBA8888(u16 color)
|
static constexpr u32 VRAMRGBA5551ToRGBA8888(u16 color)
|
||||||
{
|
{
|
||||||
u8 r = Truncate8(color & 31);
|
u8 r = Truncate8(color & 31);
|
||||||
u8 g = Truncate8((color >> 5) & 31);
|
u8 g = Truncate8((color >> 5) & 31);
|
||||||
|
@ -90,7 +90,7 @@ void TextureReplacements::DumpVRAMWrite(u32 width, u32 height, const void* pixel
|
||||||
{
|
{
|
||||||
for (u32 x = 0; x < width; x++)
|
for (u32 x = 0; x < width; x++)
|
||||||
{
|
{
|
||||||
image.SetPixel(x, y, RGBA5551ToRGBA8888(*src_pixels));
|
image.SetPixel(x, y, VRAMRGBA5551ToRGBA8888(*src_pixels));
|
||||||
src_pixels++;
|
src_pixels++;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue