From 86aad47b0418b1715a4d223adf8f59aa92619d15 Mon Sep 17 00:00:00 2001 From: notaz Date: Sun, 2 Jan 2011 00:59:02 +0200 Subject: import gpu_unai from PCSX4ALL project --- plugins/gpu_unai/gpu_fixedpoint.h | 129 ++++++++++++++++++++++++++++++++++++++ 1 file changed, 129 insertions(+) create mode 100644 plugins/gpu_unai/gpu_fixedpoint.h (limited to 'plugins/gpu_unai/gpu_fixedpoint.h') diff --git a/plugins/gpu_unai/gpu_fixedpoint.h b/plugins/gpu_unai/gpu_fixedpoint.h new file mode 100644 index 0000000..03f07d2 --- /dev/null +++ b/plugins/gpu_unai/gpu_fixedpoint.h @@ -0,0 +1,129 @@ +/*************************************************************************** + * Copyright (C) 2010 PCSX4ALL Team * + * Copyright (C) 2010 Unai * + * * + * This program is free software; you can redistribute it and/or modify * + * it under the terms of the GNU General Public License as published by * + * the Free Software Foundation; either version 2 of the License, or * + * (at your option) any later version. * + * * + * This program is distributed in the hope that it will be useful, * + * but WITHOUT ANY WARRANTY; without even the implied warranty of * + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * + * GNU General Public License for more details. * + * * + * You should have received a copy of the GNU General Public License * + * along with this program; if not, write to the * + * Free Software Foundation, Inc., * + * 51 Franklin Street, Fifth Floor, Boston, MA 02111-1307 USA. * + ***************************************************************************/ + +#ifndef FIXED_H +#define FIXED_H + +typedef s32 fixed; + +#ifdef GPU_TABLE_10_BITS +#define TABLE_BITS 10 +#else +#define TABLE_BITS 16 +#endif + +#define FIXED_BITS 16 + +#define fixed_ZERO ((fixed)0) +#define fixed_ONE ((fixed)1<<FIXED_BITS) +#define fixed_TWO ((fixed)2<<FIXED_BITS) +#define fixed_HALF ((fixed)((1<<FIXED_BITS)>>1)) + +// big precision inverse table.
+s32 s_invTable[(1<>FIXED_BITS); } + +/* +INLINE u32 Log2(u32 _a) +{ + u32 c = 0; // result of log2(v) will go here + if (_a & 0xFFFF0000) { _a >>= 16; c |= 16; } + if (_a & 0xFF00) { _a >>= 8; c |= 8; } + if (_a & 0xF0) { _a >>= 4; c |= 4; } + if (_a & 0xC) { _a >>= 2; c |= 2; } + if (_a & 0x2) { _a >>= 1; c |= 1; } + return c; +} +*/ + +#ifdef __arm__ +INLINE u32 Log2(u32 x) { u32 res; asm("clz %0,%1" : "=r" (res) : "r" (x)); return 32-res; } +#else +INLINE u32 Log2(u32 x) { u32 i = 0; for ( ; x > 0; ++i, x >>= 1); return i - 1; } +#endif + +#ifdef GPU_TABLE_10_BITS +INLINE void xInv (const fixed _b, s32& iFactor_, s32& iShift_) +{ + u32 uD = (_b<0) ? -_b : _b ; + u32 uLog = Log2(uD); + uLog = uLog>(TABLE_BITS-1) ? uLog-(TABLE_BITS-1) : 0; + u32 uDen = uD>>uLog; + iFactor_ = s_invTable[uDen]; + iFactor_ = (_b<0) ? -iFactor_ :iFactor_; + iShift_ = 15+uLog; +} +#else +INLINE void xInv (const fixed _b, s32& iFactor_, s32& iShift_) +{ + u32 uD = (_b<0) ? -_b : _b; + if(uD>1) + { + u32 uLog = Log2(uD); + uLog = uLog>(TABLE_BITS-1) ? uLog-(TABLE_BITS-1) : 0; + u32 uDen = (uD>>uLog)-1; + iFactor_ = s_invTable[uDen]; + iFactor_ = (_b<0) ? 
-iFactor_ :iFactor_; + iShift_ = 15+uLog; + } + else + { + iFactor_=_b; + iShift_ = 0; + } +} +#endif + +INLINE fixed xInvMulx (const fixed _a, const s32 _iFact, const s32 _iShift) +{ + #ifdef __arm__ + s64 res; + asm ("smull %Q0, %R0, %1, %2" : "=&r" (res) : "r"(_a) , "r"(_iFact)); + return fixed(res>>_iShift); + #else + return fixed( ((s64)(_a)*(s64)(_iFact))>>(_iShift) ); + #endif +} + +INLINE fixed xLoDivx (const fixed _a, const fixed _b) +{ + s32 iFact, iShift; + xInv(_b, iFact, iShift); + return xInvMulx(_a, iFact, iShift); +} + +/////////////////////////////////////////////////////////////////////////// +template +INLINE T Min2 (const T _a, const T _b) { return (_a<_b)?_a:_b; } + +template +INLINE T Min3 (const T _a, const T _b, const T _c) { return Min2(Min2(_a,_b),_c); } + +/////////////////////////////////////////////////////////////////////////// +template +INLINE T Max2 (const T _a, const T _b) { return (_a>_b)?_a:_b; } + +template +INLINE T Max3 (const T _a, const T _b, const T _c) { return Max2(Max2(_a,_b),_c); } + +/////////////////////////////////////////////////////////////////////////// +#endif //FIXED_H -- cgit v1.2.3