2015-05-24 04:55:12 +00:00
|
|
|
// Copyright 2008 Dolphin Emulator Project
|
2021-07-05 01:22:19 +00:00
|
|
|
// SPDX-License-Identifier: GPL-2.0-or-later
|
2009-02-23 06:17:57 +00:00
|
|
|
|
2014-02-10 18:54:46 +00:00
|
|
|
#pragma once
|
2019-07-17 00:18:48 +00:00
|
|
|
|
2021-04-26 09:55:38 +00:00
|
|
|
#include <algorithm>
|
2022-10-10 09:03:15 +00:00
|
|
|
#include <bit>
|
2021-04-26 09:55:38 +00:00
|
|
|
|
|
|
|
#include "Common/BitUtils.h"
|
2014-09-08 01:06:58 +00:00
|
|
|
#include "Common/CommonTypes.h"
|
2009-02-23 06:17:57 +00:00
|
|
|
|
2021-04-26 09:55:38 +00:00
|
|
|
#include "VideoCommon/BPMemory.h"
|
|
|
|
|
2009-02-28 19:02:37 +00:00
|
|
|
// These are accurate (disregarding AA modes).
|
2019-04-28 09:39:59 +00:00
|
|
|
constexpr u32 EFB_WIDTH = 640;
|
|
|
|
constexpr u32 EFB_HEIGHT = 528;
|
2009-02-23 06:17:57 +00:00
|
|
|
|
2015-07-24 17:46:41 +00:00
|
|
|
// Max XFB width is 720. You can only copy out 640 wide areas of efb to XFB
|
|
|
|
// so you need multiple copies to do the full width.
|
|
|
|
// The VI can do horizontal scaling (TODO: emulate).
|
2019-04-28 09:39:59 +00:00
|
|
|
constexpr u32 MAX_XFB_WIDTH = 720;
|
2009-07-15 00:51:24 +00:00
|
|
|
|
2016-11-10 00:41:16 +00:00
|
|
|
// Although EFB height is 528, 576-line XFB's can be created either with
|
2012-12-30 09:28:50 +00:00
|
|
|
// vertical scaling by the EFB copy operation or copying to multiple XFB's
|
|
|
|
// that are next to each other in memory (TODO: handle that situation).
|
2019-04-28 09:39:59 +00:00
|
|
|
constexpr u32 MAX_XFB_HEIGHT = 576;
|
2009-02-23 06:17:57 +00:00
|
|
|
|
2022-08-23 18:14:47 +00:00
|
|
|
#define PRIM_LOG(t, ...) DEBUG_LOG_FMT(VIDEO, t __VA_OPT__(, ) __VA_ARGS__)
|
2009-02-23 06:17:57 +00:00
|
|
|
|
2013-02-21 10:45:29 +00:00
|
|
|
// warning: mapping buffer should be disabled to use this
|
2020-11-14 03:33:26 +00:00
|
|
|
// #define LOG_VTX() DEBUG_LOG_FMT(VIDEO, "vtx: {} {} {}, ",
|
|
|
|
// ((float*)g_vertex_manager_write_ptr)[-3],
|
|
|
|
// ((float*)g_vertex_manager_write_ptr)[-2],
|
|
|
|
// ((float*)g_vertex_manager_write_ptr)[-1]);
|
2009-09-08 21:16:05 +00:00
|
|
|
|
|
|
|
#define LOG_VTX()
|
2009-02-23 06:17:57 +00:00
|
|
|
|
2016-07-21 23:04:57 +00:00
|
|
|
enum class APIType
|
2010-06-14 14:36:01 +00:00
|
|
|
{
|
2016-07-21 23:04:57 +00:00
|
|
|
OpenGL,
|
|
|
|
D3D,
|
2016-08-12 14:55:00 +00:00
|
|
|
Vulkan,
|
2022-06-01 09:58:13 +00:00
|
|
|
Metal,
|
2016-07-21 23:04:57 +00:00
|
|
|
Nothing
|
2015-09-14 23:43:31 +00:00
|
|
|
};
|
2010-06-14 14:36:01 +00:00
|
|
|
|
2010-12-27 03:09:11 +00:00
|
|
|
inline u32 RGBA8ToRGBA6ToRGBA8(u32 src)
|
|
|
|
{
|
|
|
|
u32 color = src;
|
|
|
|
color &= 0xFCFCFCFC;
|
|
|
|
color |= (color >> 6) & 0x03030303;
|
|
|
|
return color;
|
|
|
|
}
|
|
|
|
|
2010-12-27 18:09:03 +00:00
|
|
|
inline u32 RGBA8ToRGB565ToRGBA8(u32 src)
|
2010-12-27 03:09:11 +00:00
|
|
|
{
|
2011-01-29 04:31:56 +00:00
|
|
|
u32 color = (src & 0xF8FCF8);
|
|
|
|
color |= (color >> 5) & 0x070007;
|
|
|
|
color |= (color >> 6) & 0x000300;
|
|
|
|
color |= 0xFF000000;
|
2010-12-27 03:09:11 +00:00
|
|
|
return color;
|
|
|
|
}
|
|
|
|
|
2010-12-27 18:09:03 +00:00
|
|
|
inline u32 Z24ToZ16ToZ24(u32 src)
|
|
|
|
{
|
|
|
|
return (src & 0xFFFF00) | (src >> 16);
|
|
|
|
}
|
2021-04-26 09:55:38 +00:00
|
|
|
|
|
|
|
inline u32 CompressZ16(u32 z24depth, DepthFormat format)
|
|
|
|
{
|
|
|
|
// Flipper offers a number of choices for 16bit Z formats that adjust
|
|
|
|
// where the bulk of the precision lies.
|
|
|
|
|
|
|
|
if (format == DepthFormat::ZLINEAR)
|
|
|
|
{
|
|
|
|
// This is just a linear depth buffer with 16 bits of precision
|
|
|
|
return z24depth >> 8;
|
|
|
|
}
|
|
|
|
|
|
|
|
// ZNEAR/ZMID/ZFAR are custom floating point formats with 2/3/4 bits of exponent
|
|
|
|
// The exponent is simply the number of leading ones that have been removed
|
|
|
|
// The first zero bit is skipped and not stored. The mantissa contains the next 14/13/12 bits
|
|
|
|
// If exponent is at the MAX (3, 7, or 12) then the next bit might still be a one, and can't
|
|
|
|
// be skipped, so the mantissa simply contains the next 14/13/12 bits
|
|
|
|
|
2022-10-10 09:03:15 +00:00
|
|
|
u32 leading_ones = static_cast<u32>(std::countl_one(z24depth << 8));
|
2021-04-26 09:55:38 +00:00
|
|
|
bool next_bit_is_one = false; // AKA: Did we clamp leading_ones?
|
|
|
|
u32 exp_bits;
|
|
|
|
|
|
|
|
switch (format)
|
|
|
|
{
|
|
|
|
case DepthFormat::ZNEAR:
|
|
|
|
exp_bits = 2;
|
|
|
|
if (leading_ones >= 3u)
|
|
|
|
{
|
|
|
|
leading_ones = 3u;
|
|
|
|
next_bit_is_one = true;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case DepthFormat::ZMID:
|
|
|
|
exp_bits = 3;
|
|
|
|
if (leading_ones >= 7u)
|
|
|
|
{
|
|
|
|
leading_ones = 7u;
|
|
|
|
next_bit_is_one = true;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case DepthFormat::ZFAR:
|
|
|
|
exp_bits = 4;
|
|
|
|
if (leading_ones >= 12u)
|
|
|
|
{
|
|
|
|
// The hardware implementation only uses values 0 to 12 in the exponent
|
|
|
|
leading_ones = 12u;
|
|
|
|
next_bit_is_one = true;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return z24depth >> 8;
|
|
|
|
}
|
|
|
|
|
|
|
|
u32 mantissa_bits = 16 - exp_bits;
|
|
|
|
|
|
|
|
// Calculate which bits we need to extract from z24depth for our mantissa
|
|
|
|
u32 top = std::max<u32>(24 - leading_ones, mantissa_bits);
|
|
|
|
if (!next_bit_is_one)
|
|
|
|
{
|
|
|
|
top -= 1; // We know the next bit is zero, so we don't need to include it.
|
|
|
|
}
|
|
|
|
u32 bottom = top - mantissa_bits;
|
|
|
|
|
|
|
|
u32 exponent = leading_ones << mantissa_bits; // Upper bits contain exponent
|
|
|
|
u32 mantissa = Common::ExtractBits(z24depth, bottom, top - 1);
|
|
|
|
|
|
|
|
return exponent | mantissa;
|
|
|
|
}
|