// Copyright (C) 2003 Dolphin Project. // This program is free software: you can redistribute it and/or modify // it under the terms of the GNU General Public License as published by // the Free Software Foundation, version 2.0. // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License 2.0 for more details. // A copy of the GPL 2.0 should have been included with the program. // If not, see http://www.gnu.org/licenses/ // Official Git repository and contact information can be found at // http://code.google.com/p/dolphin-emu/ #include "Common.h" #include "FPURoundMode.h" #ifndef _WIN32 static const unsigned short FPU_ROUND_NEAR = 0 << 10; static const unsigned short FPU_ROUND_DOWN = 1 << 10; static const unsigned short FPU_ROUND_UP = 2 << 10; static const unsigned short FPU_ROUND_CHOP = 3 << 10; static const unsigned short FPU_ROUND_MASK = 3 << 10; #include #endif const u32 MASKS = 0x1F80; // mask away the interrupts. const u32 DAZ = 0x40; const u32 FTZ = 0x8000; namespace FPURoundMode { // Get the default SSE states here. static u32 saved_sse_state = _mm_getcsr(); static const u32 default_sse_state = _mm_getcsr(); void SetRoundMode(u32 mode) { // Set FPU rounding mode to mimic the PowerPC's #ifdef _M_IX86 // This shouldn't really be needed anymore since we use SSE #ifdef _WIN32 const int table[4] = { _RC_NEAR, _RC_CHOP, _RC_UP, _RC_DOWN }; _set_controlfp(_MCW_RC, table[mode]); #else const unsigned short table[4] = { FPU_ROUND_NEAR, FPU_ROUND_CHOP, FPU_ROUND_UP, FPU_ROUND_DOWN }; unsigned short _mode; asm ("fstcw %0" : "=m" (_mode) : ); _mode = (_mode & ~FPU_ROUND_MASK) | table[mode]; asm ("fldcw %0" : : "m" (_mode)); #endif #endif } void SetPrecisionMode(u32 mode) { #ifdef _M_IX86 // sets the floating-point lib to 53-bit // PowerPC has a 53bit floating pipeline only // eg: sscanf is very sensitive #ifdef _WIN32 _control87(_PC_53, MCW_PC); #else const unsigned short table[4] = { 0 << 8, // FPU_PREC_24 2 << 8, // FPU_PREC_53 3 << 8, // FPU_PREC_64 3 << 8, // FPU_PREC_MASK }; unsigned short _mode; asm ("fstcw %0" : : "m" (_mode)); _mode = (_mode & ~table[3]) | table[mode]; asm ("fldcw %0" : : "m" (_mode)); #endif #else //x64 doesn't need this - fpu is done with SSE //but still - set any useful sse options here #endif } void SetSIMDMode(u32 mode) { static const u32 ssetable[4] = { (0 << 13) | MASKS, (3 << 13) | MASKS, (2 << 13) | MASKS, (1 << 13) | MASKS, }; u32 csr = ssetable[mode]; _mm_setcsr(csr); } void SaveSIMDState() { saved_sse_state = _mm_getcsr(); } void LoadSIMDState() { _mm_setcsr(saved_sse_state); } void LoadDefaultSIMDState() { _mm_setcsr(default_sse_state); } }