diff options
Diffstat (limited to 'indra/newview/llpolymesh.cpp')
| -rw-r--r-- | indra/newview/llpolymesh.cpp | 52 | 
1 files changed, 33 insertions, 19 deletions
| diff --git a/indra/newview/llpolymesh.cpp b/indra/newview/llpolymesh.cpp index d5a2d66bcf..d10e4fee3a 100644 --- a/indra/newview/llpolymesh.cpp +++ b/indra/newview/llpolymesh.cpp @@ -35,7 +35,8 @@  //-----------------------------------------------------------------------------  #include "llviewerprecompiledheaders.h" -#include "llpolymesh.h" +#include "llfasttimer.h" +#include "llmemory.h"  #include "llviewercontrol.h"  #include "llxmltree.h" @@ -45,7 +46,7 @@  #include "llvolume.h"  #include "llendianswizzle.h" -#include "llfasttimer.h" +#include "llpolymesh.h"  #define HEADER_ASCII "Linden Mesh 1.0"  #define HEADER_BINARY "Linden Binary Mesh 1.0" @@ -140,7 +141,7 @@ void LLPolyMeshSharedData::freeMeshData()  		delete [] mDetailTexCoords;  		mDetailTexCoords = NULL; -		delete [] mWeights; +		ll_aligned_free_16(mWeights);  		mWeights = NULL;  	} @@ -230,7 +231,7 @@ BOOL LLPolyMeshSharedData::allocateVertexData( U32 numVertices )  	mBaseBinormals = new LLVector3[ numVertices ];  	mTexCoords = new LLVector2[ numVertices ];  	mDetailTexCoords = new LLVector2[ numVertices ]; -	mWeights = new F32[ numVertices ]; +	mWeights = (F32*) ll_aligned_malloc_16((numVertices*sizeof(F32)+0xF) & ~0xF);  	for (i = 0; i < numVertices; i++)  	{  		mWeights[i] = 0.f; @@ -708,20 +709,29 @@ LLPolyMesh::LLPolyMesh(LLPolyMeshSharedData *shared_data, LLPolyMesh *reference_  		mClothingWeights = reference_mesh->mClothingWeights;  	}  	else -	{ +	{ 	   #if 1	// Allocate memory without initializing every vector  		// NOTE: This makes asusmptions about the size of LLVector[234]  		int nverts = mSharedData->mNumVertices; -		int nfloats = nverts * (3*5 + 2 + 4); -		mVertexData = new F32[nfloats]; +		int nfloats = nverts * (2*4 + 3*3 + 2 + 4); + +		//use aligned vertex data to make LLPolyMesh SSE friendly +		mVertexData = (F32*) ll_aligned_malloc_16(nfloats*4);  		int offset = 0; -		mCoords = 				(LLVector3*)(mVertexData + offset); offset += 3*nverts; -		mNormals = 				(LLVector3*)(mVertexData + offset); offset += 3*nverts; -		mScaledNormals = 		(LLVector3*)(mVertexData + offset); offset += 3*nverts; -		mBinormals = 			(LLVector3*)(mVertexData + offset); offset += 3*nverts; -		mScaledBinormals = 		(LLVector3*)(mVertexData + offset); offset += 3*nverts; -		mTexCoords = 			(LLVector2*)(mVertexData + offset); offset += 2*nverts; -		mClothingWeights = 	(LLVector4*)(mVertexData + offset); offset += 4*nverts; + +		//all members must be 16-byte aligned except the last 3 +		mCoords				= 	(LLVector4*)(mVertexData + offset); offset += 4*nverts; +		mNormals			=	(LLVector4*)(mVertexData + offset); offset += 4*nverts; +		mClothingWeights	= 	(LLVector4*)(mVertexData + offset); offset += 4*nverts; +		mTexCoords			= 	(LLVector2*)(mVertexData + offset); offset += 2*nverts; + +		// these members don't need to be 16-byte aligned, but the first one might be +		// read during an aligned memcpy of mTexCoords +		mScaledNormals		=	(LLVector3*)(mVertexData + offset); offset += 3*nverts; +		mBinormals			=	(LLVector3*)(mVertexData + offset); offset += 3*nverts; +		mScaledBinormals	=	(LLVector3*)(mVertexData + offset); offset += 3*nverts; +		 +		  #else  		mCoords = new LLVector3[mSharedData->mNumVertices];  		mNormals = new LLVector3[mSharedData->mNumVertices]; @@ -757,7 +767,7 @@ LLPolyMesh::~LLPolyMesh()  	delete [] mClothingWeights;  	delete [] mTexCoords;  #else -	delete [] mVertexData; +	ll_aligned_free_16(mVertexData);  #endif  } @@ -864,7 +874,7 @@ void LLPolyMesh::dumpDiagInfo()  //-----------------------------------------------------------------------------  // getWritableCoords()  //----------------------------------------------------------------------------- -LLVector3 *LLPolyMesh::getWritableCoords() +LLVector4 *LLPolyMesh::getWritableCoords()  {  	return mCoords;  } @@ -872,7 +882,7 @@ LLVector3 *LLPolyMesh::getWritableCoords()  //-----------------------------------------------------------------------------  // getWritableNormals()  //----------------------------------------------------------------------------- -LLVector3 *LLPolyMesh::getWritableNormals() +LLVector4 *LLPolyMesh::getWritableNormals()  {  	return mNormals;  } @@ -927,8 +937,12 @@ void LLPolyMesh::initializeForMorph()  	if (!mSharedData)  		return; -	memcpy(mCoords, mSharedData->mBaseCoords, sizeof(LLVector3) * mSharedData->mNumVertices);	/*Flawfinder: ignore*/ -	memcpy(mNormals, mSharedData->mBaseNormals, sizeof(LLVector3) * mSharedData->mNumVertices);	/*Flawfinder: ignore*/ +	for (U32 i = 0; i < mSharedData->mNumVertices; ++i) +	{ +		mCoords[i] = LLVector4(mSharedData->mBaseCoords[i]); +		mNormals[i] = LLVector4(mSharedData->mBaseNormals[i]); +	} +  	memcpy(mScaledNormals, mSharedData->mBaseNormals, sizeof(LLVector3) * mSharedData->mNumVertices);	/*Flawfinder: ignore*/  	memcpy(mBinormals, mSharedData->mBaseBinormals, sizeof(LLVector3) * mSharedData->mNumVertices);	/*Flawfinder: ignore*/  	memcpy(mScaledBinormals, mSharedData->mBaseBinormals, sizeof(LLVector3) * mSharedData->mNumVertices);		/*Flawfinder: ignore*/ | 
