/** * @file llv4math.h * @brief LLV4* class header file - vector processor enabled math * * $LicenseInfo:firstyear=2007&license=viewerlgpl$ * Second Life Viewer Source Code * Copyright (C) 2010, Linden Research, Inc. * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; * version 2.1 of the License only. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with this library; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA * * Linden Research, Inc., 945 Battery Street, San Francisco, CA 94111 USA * $/LicenseInfo$ */ #ifndef LL_LLV4MATH_H #define LL_LLV4MATH_H // *NOTE: We do not support SSE acceleration on Windows builds. // Our minimum specification for the viewer includes 1 GHz Athlon processors, // which covers the Athlon Thunderbird series that does not support SSE. // // Our header files include statements like this // const F32 HAVOK_TIMESTEP = 1.f / 45.f; // This creates "globals" that are included in each .obj file. If a single // .cpp file has SSE code generation turned on (eg, llviewerjointmesh_sse.cpp) // these globals will be initialized using SSE instructions. This causes SL // to crash before main() on processors without SSE. Untangling all these // headers/variables is too much work for the small performance gains of // vectorization. // // Therefore we only support vectorization on builds where the everything is // built with SSE or Altivec. See https://jira.secondlife.com/browse/VWR-1610 // and https://jira.lindenlab.com/browse/SL-47720 for details. // // Sorry the code is such a mess. JC //----------------------------------------------------------------------------- //----------------------------------------------------------------------------- // LLV4MATH - GNUC //----------------------------------------------------------------------------- //----------------------------------------------------------------------------- #if LL_GNUC && __GNUC__ >= 4 && __SSE__ #define LL_VECTORIZE 1 #if LL_DARWIN #include <Accelerate/Accelerate.h> #include <xmmintrin.h> typedef vFloat V4F32; #else #include <xmmintrin.h> typedef float V4F32 __attribute__((vector_size(16))); #endif #endif #if LL_GNUC #define LL_LLV4MATH_ALIGN_PREFIX #define LL_LLV4MATH_ALIGN_POSTFIX __attribute__((aligned(16))) #endif //----------------------------------------------------------------------------- //----------------------------------------------------------------------------- // LLV4MATH - MSVC //----------------------------------------------------------------------------- //----------------------------------------------------------------------------- // Only vectorize if the entire Windows build uses SSE. // _M_IX86_FP is set when SSE code generation is turned on, and I have // confirmed this in VS2003, VS2003 SP1, and VS2005. JC #if LL_MSVC && _M_IX86_FP #define LL_VECTORIZE 1 #include <xmmintrin.h> typedef __m128 V4F32; #endif #if LL_MSVC #define LL_LLV4MATH_ALIGN_PREFIX __declspec(align(16)) #define LL_LLV4MATH_ALIGN_POSTFIX #endif //----------------------------------------------------------------------------- //----------------------------------------------------------------------------- // LLV4MATH - default - no vectorization //----------------------------------------------------------------------------- //----------------------------------------------------------------------------- #if !LL_VECTORIZE #define LL_VECTORIZE 0 struct V4F32 { F32 __pad__[4]; }; inline F32 llv4lerp(F32 a, F32 b, F32 w) { return ( b - a ) * w + a; } #endif #ifndef LL_LLV4MATH_ALIGN_PREFIX # define LL_LLV4MATH_ALIGN_PREFIX #endif #ifndef LL_LLV4MATH_ALIGN_POSTFIX # define LL_LLV4MATH_ALIGN_POSTFIX #endif //----------------------------------------------------------------------------- //----------------------------------------------------------------------------- // LLV4MATH //----------------------------------------------------------------------------- //----------------------------------------------------------------------------- #define LLV4_NUM_AXIS 4 class LLV4Vector3; class LLV4Matrix3; class LLV4Matrix4; #endif