121 lines
2.9 KiB
C++
121 lines
2.9 KiB
C++
// Copyright (C) 2003 Dolphin Project.
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU General Public License as published by
|
|
// the Free Software Foundation, version 2.0.
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU General Public License 2.0 for more details.
|
|
|
|
// A copy of the GPL 2.0 should have been included with the program.
|
|
// If not, see http://www.gnu.org/licenses/
|
|
|
|
// Official SVN repository and contact information can be found at
|
|
// http://code.google.com/p/dolphin-emu/
|
|
|
|
#include "Common.h"
|
|
#include "FPURoundMode.h"
|
|
|
|
#ifndef _WIN32
|
|
static const unsigned short FPU_ROUND_NEAR = 0 << 10;
|
|
static const unsigned short FPU_ROUND_DOWN = 1 << 10;
|
|
static const unsigned short FPU_ROUND_UP = 2 << 10;
|
|
static const unsigned short FPU_ROUND_CHOP = 3 << 10;
|
|
static const unsigned short FPU_ROUND_MASK = 3 << 10;
|
|
#include <xmmintrin.h>
|
|
#endif
|
|
|
|
const u32 MASKS = 0x1F80; // mask away the interrupts.
|
|
const u32 DAZ = 0x40;
|
|
const u32 FTZ = 0x8000;
|
|
|
|
namespace FPURoundMode
|
|
{
|
|
// Get the default SSE states here.
|
|
static u32 saved_sse_state = _mm_getcsr();
|
|
static const u32 default_sse_state = _mm_getcsr();
|
|
|
|
void SetRoundMode(u32 mode)
|
|
{
|
|
// Set FPU rounding mode to mimic the PowerPC's
|
|
#ifdef _M_IX86
|
|
// This shouldn't really be needed anymore since we use SSE
|
|
#ifdef _WIN32
|
|
const int table[4] =
|
|
{
|
|
_RC_NEAR,
|
|
_RC_CHOP,
|
|
_RC_UP,
|
|
_RC_DOWN
|
|
};
|
|
_set_controlfp(_MCW_RC, table[mode]);
|
|
#else
|
|
const unsigned short table[4] =
|
|
{
|
|
FPU_ROUND_NEAR,
|
|
FPU_ROUND_CHOP,
|
|
FPU_ROUND_UP,
|
|
FPU_ROUND_DOWN
|
|
};
|
|
unsigned short _mode;
|
|
asm ("fstcw %0" : "=m" (_mode) : );
|
|
_mode = (_mode & ~FPU_ROUND_MASK) | table[mode];
|
|
asm ("fldcw %0" : : "m" (_mode));
|
|
#endif
|
|
#endif
|
|
}
|
|
|
|
void SetPrecisionMode(u32 mode)
|
|
{
|
|
#ifdef _M_IX86
|
|
// sets the floating-point lib to 53-bit
|
|
// PowerPC has a 53bit floating pipeline only
|
|
// eg: sscanf is very sensitive
|
|
#ifdef _WIN32
|
|
_control87(_PC_53, MCW_PC);
|
|
#else
|
|
const unsigned short table[4] = {
|
|
0 << 8, // FPU_PREC_24
|
|
2 << 8, // FPU_PREC_53
|
|
3 << 8, // FPU_PREC_64
|
|
3 << 8, // FPU_PREC_MASK
|
|
};
|
|
unsigned short _mode;
|
|
asm ("fstcw %0" : : "m" (_mode));
|
|
_mode = (_mode & ~table[3]) | table[mode];
|
|
asm ("fldcw %0" : : "m" (_mode));
|
|
#endif
|
|
#else
|
|
//x64 doesn't need this - fpu is done with SSE
|
|
//but still - set any useful sse options here
|
|
#endif
|
|
}
|
|
void SetSIMDMode(u32 mode)
|
|
{
|
|
static const u32 ssetable[4] =
|
|
{
|
|
(0 << 13) | MASKS,
|
|
(3 << 13) | MASKS,
|
|
(2 << 13) | MASKS,
|
|
(1 << 13) | MASKS,
|
|
};
|
|
u32 csr = ssetable[mode];
|
|
_mm_setcsr(csr);
|
|
}
|
|
|
|
void SaveSIMDState()
|
|
{
|
|
saved_sse_state = _mm_getcsr();
|
|
}
|
|
void LoadSIMDState()
|
|
{
|
|
_mm_setcsr(saved_sse_state);
|
|
}
|
|
void LoadDefaultSIMDState()
|
|
{
|
|
_mm_setcsr(default_sse_state);
|
|
}
|
|
}
|