/indra/llmath/llv4math.h
C Header | 141 lines | 42 code | 33 blank | 66 comment | 3 complexity | 8efa25a98abd70ad61a122ad3127e954 MD5 | raw file
Possible License(s): LGPL-2.1
- /**
- * @file llv4math.h
- * @brief LLV4* class header file - vector processor enabled math
- *
- * $LicenseInfo:firstyear=2007&license=viewerlgpl$
- * Second Life Viewer Source Code
- * Copyright (C) 2010, Linden Research, Inc.
- *
- * This library is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public
- * License as published by the Free Software Foundation;
- * version 2.1 of the License only.
- *
- * This library is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with this library; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- *
- * Linden Research, Inc., 945 Battery Street, San Francisco, CA 94111 USA
- * $/LicenseInfo$
- */
- #ifndef LL_LLV4MATH_H
- #define LL_LLV4MATH_H
- // *NOTE: We do not support SSE acceleration on Windows builds.
- // Our minimum specification for the viewer includes 1 GHz Athlon processors,
- // which covers the Athlon Thunderbird series that does not support SSE.
- //
- // Our header files include statements like this
- // const F32 HAVOK_TIMESTEP = 1.f / 45.f;
- // This creates "globals" that are included in each .obj file. If a single
- // .cpp file has SSE code generation turned on (eg, llviewerjointmesh_sse.cpp)
- // these globals will be initialized using SSE instructions. This causes SL
- // to crash before main() on processors without SSE. Untangling all these
- // headers/variables is too much work for the small performance gains of
- // vectorization.
- //
- // Therefore we only support vectorization on builds where the everything is
- // built with SSE or Altivec. See https://jira.secondlife.com/browse/VWR-1610
- // and https://jira.lindenlab.com/browse/SL-47720 for details.
- //
- // Sorry the code is such a mess. JC
- //-----------------------------------------------------------------------------
- //-----------------------------------------------------------------------------
- // LLV4MATH - GNUC
- //-----------------------------------------------------------------------------
- //-----------------------------------------------------------------------------
- #if LL_GNUC && __GNUC__ >= 4 && __SSE__
- #define LL_VECTORIZE 1
- #if LL_DARWIN
- #include <Accelerate/Accelerate.h>
- #include <xmmintrin.h>
- typedef vFloat V4F32;
- #else
- #include <xmmintrin.h>
- typedef float V4F32 __attribute__((vector_size(16)));
- #endif
- #endif
- #if LL_GNUC
- #define LL_LLV4MATH_ALIGN_PREFIX
- #define LL_LLV4MATH_ALIGN_POSTFIX __attribute__((aligned(16)))
- #endif
- //-----------------------------------------------------------------------------
- //-----------------------------------------------------------------------------
- // LLV4MATH - MSVC
- //-----------------------------------------------------------------------------
- //-----------------------------------------------------------------------------
- // Only vectorize if the entire Windows build uses SSE.
- // _M_IX86_FP is set when SSE code generation is turned on, and I have
- // confirmed this in VS2003, VS2003 SP1, and VS2005. JC
- #if LL_MSVC && _M_IX86_FP
- #define LL_VECTORIZE 1
- #include <xmmintrin.h>
- typedef __m128 V4F32;
- #endif
- #if LL_MSVC
- #define LL_LLV4MATH_ALIGN_PREFIX __declspec(align(16))
- #define LL_LLV4MATH_ALIGN_POSTFIX
- #endif
- //-----------------------------------------------------------------------------
- //-----------------------------------------------------------------------------
- // LLV4MATH - default - no vectorization
- //-----------------------------------------------------------------------------
- //-----------------------------------------------------------------------------
- #if !LL_VECTORIZE
- #define LL_VECTORIZE 0
- struct V4F32 { F32 __pad__[4]; };
- inline F32 llv4lerp(F32 a, F32 b, F32 w) { return ( b - a ) * w + a; }
- #endif
- #ifndef LL_LLV4MATH_ALIGN_PREFIX
- # define LL_LLV4MATH_ALIGN_PREFIX
- #endif
- #ifndef LL_LLV4MATH_ALIGN_POSTFIX
- # define LL_LLV4MATH_ALIGN_POSTFIX
- #endif
- //-----------------------------------------------------------------------------
- //-----------------------------------------------------------------------------
- // LLV4MATH
- //-----------------------------------------------------------------------------
- //-----------------------------------------------------------------------------
- #define LLV4_NUM_AXIS 4
- class LLV4Vector3;
- class LLV4Matrix3;
- class LLV4Matrix4;
- #endif