501 lines
19 KiB
C++
501 lines
19 KiB
C++
/**
|
|
* @file llskinningutil.cpp
|
|
* @brief Functions for mesh object skinning
|
|
* @author vir@lindenlab.com
|
|
*
|
|
* $LicenseInfo:firstyear=2015&license=viewerlgpl$
|
|
* Second Life Viewer Source Code
|
|
* Copyright (C) 2015, Linden Research, Inc.
|
|
*
|
|
* This library is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation;
|
|
* version 2.1 of the License only.
|
|
*
|
|
* This library is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with this library; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*
|
|
* Linden Research, Inc., 945 Battery Street, San Francisco, CA 94111 USA
|
|
* $/LicenseInfo$
|
|
*/
|
|
|
|
#include "llviewerprecompiledheaders.h"
|
|
|
|
#include "llskinningutil.h"
|
|
#include "llvoavatar.h"
|
|
#include "llviewercontrol.h"
|
|
#include "llmeshrepository.h"
|
|
#include "llvolume.h"
|
|
#include "llrigginginfo.h"
|
|
|
|
void dump_avatar_and_skin_state(const std::string& reason, LLVOAvatar *avatar, const LLMeshSkinInfo *skin)
|
|
{
|
|
static S32 dump_count = 0;
|
|
const S32 max_dump = 10;
|
|
|
|
if (dump_count < max_dump)
|
|
{
|
|
LL_WARNS("Avatar") << avatar->getFullname() << " dumping, reason " << reason
|
|
<< " avatar build state: isBuilt() " << avatar->isBuilt()
|
|
<< " mInitFlags " << avatar->mInitFlags << LL_ENDL;
|
|
LL_WARNS("Avatar") << "Skin num joints " << skin->mJointNames.size() << " " << skin->mJointNums.size() << LL_ENDL;
|
|
LL_WARNS("Avatar") << "Skin scrubbed " << skin->mInvalidJointsScrubbed
|
|
<< " nums init " << skin->mJointNumsInitialized << LL_ENDL;
|
|
for (S32 j=0; j<skin->mJointNames.size(); j++)
|
|
{
|
|
LL_WARNS("Avatar") << "skin joint idx " << j << " name [" << skin->mJointNames[j]
|
|
<< "] num " << skin->mJointNums[j] << LL_ENDL;
|
|
//<FS:ND> Query by JointKey rather than just a string, the key can be a U32 index for faster lookup
|
|
//const std::string& name = skin->mJointNames[j];
|
|
const std::string& name = skin->mJointNames[j].mName;
|
|
// </FS:ND>
|
|
S32 joint_num = skin->mJointNums[j];
|
|
|
|
LLJoint *name_joint = avatar->getJoint(name);
|
|
LLJoint *num_joint = avatar->getJoint(joint_num);
|
|
if (!name_joint)
|
|
{
|
|
LL_WARNS("Avatar") << "failed to find joint by name" << LL_ENDL;
|
|
}
|
|
if (!num_joint)
|
|
{
|
|
LL_WARNS("Avatar") << "failed to find joint by num" << LL_ENDL;
|
|
}
|
|
if (num_joint != name_joint)
|
|
{
|
|
LL_WARNS("Avatar") << "joint pointers don't match" << LL_ENDL;
|
|
}
|
|
if (num_joint && num_joint->getJointNum() != joint_num)
|
|
{
|
|
LL_WARNS("Avatar") << "joint found by num has wrong num " << joint_num << "!=" << num_joint->getJointNum() << LL_ENDL;
|
|
}
|
|
if (name_joint && name_joint->getJointNum() != joint_num)
|
|
{
|
|
LL_WARNS("Avatar") << "joint found by name has wrong num " << joint_num << "!=" << name_joint->getJointNum() << LL_ENDL;
|
|
}
|
|
}
|
|
LL_WARNS("Avatar") << LL_ENDL;
|
|
|
|
dump_count++;
|
|
}
|
|
}
|
|
|
|
// Returns LL_MAX_JOINTS_PER_MESH_OBJECT as a U32: the upper bound applied by
// getMeshJointCount() to the number of joints reported for a skin.
U32 LLSkinningUtil::getMaxJointCount()
{
    return static_cast<U32>(LL_MAX_JOINTS_PER_MESH_OBJECT);
}
|
|
|
|
// Returns the number of joint names in the skin, capped at getMaxJointCount().
//
// skin - skin info to inspect; dereferenced unconditionally.
U32 LLSkinningUtil::getMeshJointCount(const LLMeshSkinInfo *skin)
{
    const U32 joint_limit = (U32)getMaxJointCount();
    const U32 skin_joints = (U32)skin->mJointNames.size();
    return llmin(joint_limit, skin_joints);
}
|
|
|
|
// Replaces every joint name in the skin that the avatar cannot resolve with
// "mPelvis", then marks the skin as scrubbed so the work is done only once.
// Whenever a name is replaced, mJointNumsInitialized is cleared so the joint
// numbers get re-resolved by initJointNums().
//
// avatar - avatar used to resolve joint names; dereferenced unconditionally.
// skin   - skin info to fix up in place; dereferenced unconditionally.
void LLSkinningUtil::scrubInvalidJoints(LLVOAvatar *avatar, LLMeshSkinInfo* skin)
{
    if (skin->mInvalidJointsScrubbed)
    {
        return;
    }
    for (U32 j = 0; j < skin->mJointNames.size(); ++j)
    {
        // Fix invalid names to "mPelvis". Currently meshes with
        // invalid names will be blocked on upload, so this is just
        // needed for handling of any legacy bad data.
        if (!avatar->getJoint(skin->mJointNames[j]))
        {
            //<FS:ND> Query by JointKey rather than just a string, the key can be a U32 index for faster lookup
            //LL_DEBUGS("Avatar") << avatar->getFullname() << " mesh rigged to invalid joint " << skin->mJointNames[j] << LL_ENDL;
            //LL_WARNS_ONCE("Avatar") << avatar->getFullname() << " mesh rigged to invalid joint" << skin->mJointNames[j] << LL_ENDL;
            //skin->mJointNames[ j ] = "mPelvis";
            LL_DEBUGS("Avatar") << avatar->getFullname() << " mesh rigged to invalid joint " << skin->mJointNames[j].mName << LL_ENDL;
            // Note the space before the joint name: without it the name runs
            // straight into the word "joint" in the log output.
            LL_WARNS_ONCE("Avatar") << avatar->getFullname() << " mesh rigged to invalid joint " << skin->mJointNames[j].mName << LL_ENDL;
            skin->mJointNames[ j ] = JointKey::construct( "mPelvis" );
            //</FS:ND>
            skin->mJointNumsInitialized = false; // force update after names change.
        }
    }
    skin->mInvalidJointsScrubbed = true;
}
|
|
|
|
//<FS:Beq> Per frame SkinningMatrix Caching
|
|
//void LLSkinningUtil::initSkinningMatrixPalette(
|
|
// LLMatrix4* mat,
|
|
// S32 count,
|
|
// const LLMeshSkinInfo* skin,
|
|
// LLVOAvatar *avatar)
|
|
//{
|
|
// initJointNums(const_cast<LLMeshSkinInfo*>(skin), avatar);
|
|
// for (U32 j = 0; j < count; ++j)
|
|
// {
|
|
// LLJoint *joint = avatar->getJoint(skin->mJointNums[j]);
|
|
// if (joint)
|
|
// {
|
|
//#define MAT_USE_SSE
|
|
//#ifdef MAT_USE_SSE
|
|
// LLMatrix4a bind, world, res;
|
|
// bind.loadu(skin->mInvBindMatrix[j]);
|
|
// world.loadu(joint->getWorldMatrix());
|
|
// matMul(bind, world, res);
|
|
// memcpy(mat[j].mMatrix, res.mMatrix, 16 * sizeof(float));
|
|
//#else
|
|
// mat[j] = skin->mInvBindMatrix[j];
|
|
// mat[j] *= joint->getWorldMatrix();
|
|
//#endif
|
|
// }
|
|
// else
|
|
// {
|
|
// mat[j] = skin->mInvBindMatrix[j];
|
|
// // This shouldn't happen - in mesh upload, skinned
|
|
// // rendering should be disabled unless all joints are
|
|
// // valid. In other cases of skinned rendering, invalid
|
|
// // joints should already have been removed during scrubInvalidJoints().
|
|
// LL_WARNS_ONCE("Avatar") << avatar->getFullname()
|
|
// << " rigged to invalid joint name " << skin->mJointNames[j]
|
|
// << " num " << skin->mJointNums[j] << LL_ENDL;
|
|
// LL_WARNS_ONCE("Avatar") << avatar->getFullname()
|
|
// << " avatar build state: isBuilt() " << avatar->isBuilt()
|
|
// << " mInitFlags " << avatar->mInitFlags << LL_ENDL;
|
|
//#if 0
|
|
// dump_avatar_and_skin_state("initSkinningMatrixPalette joint not found", avatar, skin);
|
|
//#endif
|
|
// }
|
|
// }
|
|
//}
|
|
|
|
#ifndef LL_RELEASE_FOR_DOWNLOAD
|
|
static LLTrace::BlockTimerStatHandle FTM_SKINNING_INIT("Init Skinning Mats");
|
|
#endif
|
|
|
|
void LLSkinningUtil::initSkinningMatrixPalette(
|
|
LLMatrix4a* mat,
|
|
S32 count,
|
|
const LLMeshSkinInfo* skin,
|
|
LLVOAvatar *avatar)
|
|
{
|
|
#ifndef LL_RELEASE_FOR_DOWNLOAD
|
|
// This timer is too hot for normal use (though better now with caching)
|
|
LL_RECORD_BLOCK_TIME(FTM_SKINNING_INIT);
|
|
#endif
|
|
LLMatrix4a bind[LL_MAX_JOINTS_PER_MESH_OBJECT];
|
|
LLMatrix4a world[LL_MAX_JOINTS_PER_MESH_OBJECT];
|
|
|
|
initJointNums(const_cast<LLMeshSkinInfo*>(skin), avatar);
|
|
// TODO: Refactored to encourage the compiler to optimise better but it's too old and stubborn. Need to hand tool the SIMD.
|
|
// TODO: There are two overheads in this function casued by the unaligned loads. use Matrix4a
|
|
// TODO: getWorldMatrix forces a reverse recursion up through the skelly. Check if this is happening efficiently.
|
|
for (S32 j = 0; j < count; ++j)
|
|
{
|
|
LLJoint *joint = avatar->getJoint(skin->mJointNums[j]);
|
|
if (joint != nullptr){
|
|
bind[j].loadu(skin->mInvBindMatrix[j]);
|
|
world[j].loadu(joint->getWorldMatrix());
|
|
matMul(bind[j], world[j], mat[j]);
|
|
}
|
|
else
|
|
{
|
|
mat[j].loadu(skin->mInvBindMatrix[j]);
|
|
// This shouldn't happen - in mesh upload, skinned
|
|
// rendering should be disabled unless all joints are
|
|
// valid. In other cases of skinned rendering, invalid
|
|
// joints should already have been removed during scrubInvalidJoints().
|
|
// Beq note - Oct 2018 Animesh - Many rigged meshes still fail here. ('mElbowLeeft' typo in the rigging data)
|
|
LL_WARNS_ONCE("Avatar") << avatar->getFullname()
|
|
<< " rigged to invalid joint name " << skin->mJointNames[j]
|
|
<< " num " << skin->mJointNums[j] << LL_ENDL;
|
|
LL_WARNS_ONCE("Avatar") << avatar->getFullname()
|
|
<< " avatar build state: isBuilt() " << avatar->isBuilt()
|
|
<< " mInitFlags " << avatar->mInitFlags << LL_ENDL;
|
|
|
|
}
|
|
//LL_DEBUGS("Skinning") << "[" << avatar->getFullname() << "] joint(" << skin->mJointNames[j] << ") matices bind(" << bind << ") world(" << world << ")" << LL_ENDL;
|
|
}
|
|
}
|
|
//</FS:Beq>
|
|
|
|
// Debug-only validation of packed skin weights. Each of the four floats per
// vertex is treated as (joint index) + (fractional weight). When SHOW_ASSERT
// is defined this asserts that every index lies in [0, number of joint names)
// and that the fractional parts of each vertex sum to more than zero.
// Without SHOW_ASSERT the function body is empty.
//
// weights      - array of num_vertices packed weight vectors.
// num_vertices - number of entries in weights.
// skin         - skin info supplying the joint count.
void LLSkinningUtil::checkSkinWeights(LLVector4a* weights, U32 num_vertices, const LLMeshSkinInfo* skin)
{
#ifdef SHOW_ASSERT // same condition that controls llassert()
    const S32 joint_limit = skin->mJointNames.size();
    for (U32 vert = 0; vert < num_vertices; ++vert)
    {
        F32 *packed = weights[vert].getF32ptr();

        F32 fraction_total = 0.0;
        for (U32 slot = 0; slot < 4; ++slot)
        {
            S32 joint_idx = llfloor(packed[slot]);
            llassert(joint_idx >= 0);
            llassert(joint_idx < joint_limit);
            fraction_total += packed[slot] - joint_idx;
        }
        llassert(fraction_total > 0.0f);
    }
#endif
}
|
|
|
|
// Clamps the joint index encoded in every packed skin weight to
// [0, number of joint names - 1] while keeping its fractional weight, then
// runs checkSkinWeights() on the result.
//
// weights      - array of num_vertices packed weight vectors, modified in place.
// num_vertices - number of entries in weights.
// skin         - skin info supplying the joint count.
void LLSkinningUtil::scrubSkinWeights(LLVector4a* weights, U32 num_vertices, const LLMeshSkinInfo* skin)
{
    const S32 joint_count = skin->mJointNames.size();
    for (U32 vert = 0; vert < num_vertices; ++vert)
    {
        F32 *packed = weights[vert].getF32ptr();

        for (U32 slot = 0; slot < 4; ++slot)
        {
            // Split into integer joint index and fractional weight, clamp
            // only the index, and re-pack.
            const S32 raw_idx = llfloor(packed[slot]);
            const F32 fraction = packed[slot] - raw_idx;
            const S32 safe_idx = llclamp(raw_idx, 0, joint_count - 1);
            packed[slot] = safe_idx + fraction;
        }
    }
    checkSkinWeights(weights, num_vertices, skin);
}
|
|
|
|
// Blends up to four palette matrices into the skinning matrix for one vertex.
// Each of the four input floats encodes (joint index) + (fractional weight).
// Indices are clamped to [0, max_joints-1]; the fractional weights are
// normalized to sum to one before blending.
//
// weights          - four packed index+weight floats for the vertex.
// mat              - matrix palette indexed by joint index.
// handle_bad_scale - when true and the weights sum to <= 0, all weight is
//                    given to the first slot instead of dividing by the sum
//                    (and the final llassert fires in assert-enabled builds).
// final_mat        - output; cleared and then accumulated into.
// max_joints       - number of usable entries in mat.
void LLSkinningUtil::getPerVertexSkinMatrix(
    F32* weights,
    LLMatrix4a* mat,
    bool handle_bad_scale,
    LLMatrix4a& final_mat,
    U32 max_joints)
{
    final_mat.clear();

    S32 idx[4];
    LLVector4 wght;
    F32 scale = 0.f;

    for (U32 k = 0; k < 4; k++)
    {
        const F32 packed = weights[k];
        const F32 whole = floorf(packed);

        // BENTO potential optimizations
        // - Do clamping in unpackVolumeFaces() (once instead of every time)
        // - int vs floor: if we know w is
        // >= 0.0, we can use int instead of floorf; the latter
        // allegedly has a lot of overhead due to ieeefp error
        // checking which we should not need.
        idx[k] = llclamp((S32) whole, (S32)0, (S32)max_joints-1);

        wght[k] = packed - whole;
        scale += wght[k];
    }

    const bool bad_scale = handle_bad_scale && scale <= 0.f;
    if (bad_scale)
    {
        wght = LLVector4(1.0f, 0.0f, 0.0f, 0.0f);
    }
    else
    {
        // This is enforced in unpackVolumeFaces()
        llassert(scale>0.f);
        wght *= 1.f/scale;
    }

    for (U32 k = 0; k < 4; k++)
    {
        LLMatrix4a weighted;
        weighted.setMul(mat[idx[k]], wght[k]);
        final_mat.add(weighted);
    }

    // SL-366 - with weight validation/cleanup code, it should no longer be
    // possible to hit the bad scale case.
    llassert(!bad_scale);
}
|
|
|
|
// Resolves the skin's joint names to avatar joint numbers, once per skin.
// Only slots whose number is still -1 are looked up; a warning is logged when
// a name cannot be found or when the resolved number is negative. The skin is
// flagged as initialized afterwards regardless of lookup failures.
//
// skin   - skin info whose mJointNums table is filled in place.
// avatar - avatar used to look joints up by name.
void LLSkinningUtil::initJointNums(LLMeshSkinInfo* skin, LLVOAvatar *avatar)
{
    if (skin->mJointNumsInitialized)
    {
        return;
    }

    for (U32 j = 0; j < skin->mJointNames.size(); ++j)
    {
        if (skin->mJointNums[j] != -1)
        {
            // Already resolved.
            continue;
        }

        LLJoint *joint = avatar->getJoint(skin->mJointNames[j]);
        if (!joint)
        {
            LL_WARNS_ONCE("Avatar") << avatar->getFullname() << " unable to find joint " << skin->mJointNames[j] << LL_ENDL;
            LL_WARNS_ONCE("Avatar") << avatar->getFullname() << " avatar build state: isBuilt() " << avatar->isBuilt() << " mInitFlags " << avatar->mInitFlags << LL_ENDL;
#if 0
            dump_avatar_and_skin_state("initJointNums joint not found", avatar, skin);
#endif
            continue;
        }

        skin->mJointNums[j] = joint->getJointNum();
        if (skin->mJointNums[j] < 0)
        {
            LL_WARNS_ONCE("Avatar") << avatar->getFullname() << " joint has unusual number " << skin->mJointNames[j] << ": " << skin->mJointNums[j] << LL_ENDL;
            LL_WARNS_ONCE("Avatar") << avatar->getFullname() << " avatar build state: isBuilt() " << avatar->isBuilt() << " mInitFlags " << avatar->mInitFlags << LL_ENDL;
        }
    }
    skin->mJointNumsInitialized = true;
}
|
|
|
|
static LLTrace::BlockTimerStatHandle FTM_FACE_RIGGING_INFO("Face Rigging Info");
|
|
|
|
void LLSkinningUtil::updateRiggingInfo(const LLMeshSkinInfo* skin, LLVOAvatar *avatar, LLVolumeFace& vol_face)
|
|
{
|
|
LL_RECORD_BLOCK_TIME(FTM_FACE_RIGGING_INFO);
|
|
|
|
if (vol_face.mJointRiggingInfoTab.needsUpdate())
|
|
{
|
|
S32 num_verts = vol_face.mNumVertices;
|
|
if (num_verts>0 && vol_face.mWeights && (skin->mJointNames.size()>0))
|
|
{
|
|
initJointNums(const_cast<LLMeshSkinInfo*>(skin), avatar);
|
|
if (vol_face.mJointRiggingInfoTab.size()==0)
|
|
{
|
|
//std::set<S32> active_joints;
|
|
//S32 active_verts = 0;
|
|
vol_face.mJointRiggingInfoTab.resize(LL_CHARACTER_MAX_ANIMATED_JOINTS);
|
|
LLJointRiggingInfoTab &rig_info_tab = vol_face.mJointRiggingInfoTab;
|
|
for (S32 i=0; i<vol_face.mNumVertices; i++)
|
|
{
|
|
LLVector4a& pos = vol_face.mPositions[i];
|
|
F32 *weights = vol_face.mWeights[i].getF32ptr();
|
|
LLVector4 wght;
|
|
S32 idx[4];
|
|
F32 scale = 0.0f;
|
|
// FIXME unpacking of weights should be pulled into a common function and optimized if possible.
|
|
for (U32 k = 0; k < 4; k++)
|
|
{
|
|
F32 w = weights[k];
|
|
idx[k] = llclamp((S32) floorf(w), (S32)0, (S32)LL_CHARACTER_MAX_ANIMATED_JOINTS-1);
|
|
wght[k] = w - idx[k];
|
|
scale += wght[k];
|
|
}
|
|
if (scale > 0.0f)
|
|
{
|
|
for (U32 k=0; k<4; ++k)
|
|
{
|
|
wght[k] /= scale;
|
|
}
|
|
}
|
|
for (U32 k=0; k<4; ++k)
|
|
{
|
|
S32 joint_index = idx[k];
|
|
if (wght[k] > 0.0f)
|
|
{
|
|
S32 joint_num = skin->mJointNums[joint_index];
|
|
if (joint_num >= 0 && joint_num < LL_CHARACTER_MAX_ANIMATED_JOINTS)
|
|
{
|
|
rig_info_tab[joint_num].setIsRiggedTo(true);
|
|
|
|
// FIXME could precompute these matMuls.
|
|
LLMatrix4a bind_shape;
|
|
bind_shape.loadu(skin->mBindShapeMatrix);
|
|
LLMatrix4a inv_bind;
|
|
inv_bind.loadu(skin->mInvBindMatrix[joint_index]);
|
|
LLMatrix4a mat;
|
|
matMul(bind_shape, inv_bind, mat);
|
|
LLVector4a pos_joint_space;
|
|
mat.affineTransform(pos, pos_joint_space);
|
|
pos_joint_space.mul(wght[k]);
|
|
LLVector4a *extents = rig_info_tab[joint_num].getRiggedExtents();
|
|
update_min_max(extents[0], extents[1], pos_joint_space);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
//LL_DEBUGS("RigSpammish") << "built rigging info for vf " << &vol_face
|
|
// << " num_verts " << vol_face.mNumVertices
|
|
// << " active joints " << active_joints.size()
|
|
// << " active verts " << active_verts
|
|
// << LL_ENDL;
|
|
vol_face.mJointRiggingInfoTab.setNeedsUpdate(false);
|
|
}
|
|
}
|
|
if (vol_face.mJointRiggingInfoTab.size()!=0)
|
|
{
|
|
LL_DEBUGS("RigSpammish") << "we have rigging info for vf " << &vol_face
|
|
<< " num_verts " << vol_face.mNumVertices << LL_ENDL;
|
|
}
|
|
else
|
|
{
|
|
LL_DEBUGS("RigSpammish") << "no rigging info for vf " << &vol_face
|
|
<< " num_verts " << vol_face.mNumVertices << LL_ENDL;
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
// This is used for extracting rotation from a bind shape matrix that
|
|
// already has scales baked in
|
|
LLQuaternion LLSkinningUtil::getUnscaledQuaternion(const LLMatrix4& mat4)
|
|
{
|
|
LLMatrix3 bind_mat = mat4.getMat3();
|
|
for (auto i = 0; i < 3; i++)
|
|
{
|
|
F32 len = 0.0f;
|
|
for (auto j = 0; j < 3; j++)
|
|
{
|
|
len += bind_mat.mMatrix[i][j] * bind_mat.mMatrix[i][j];
|
|
}
|
|
if (len > 0.0f)
|
|
{
|
|
len = sqrt(len);
|
|
for (auto j = 0; j < 3; j++)
|
|
{
|
|
bind_mat.mMatrix[i][j] /= len;
|
|
}
|
|
}
|
|
}
|
|
bind_mat.invert();
|
|
LLQuaternion bind_rot = bind_mat.quaternion();
|
|
bind_rot.normalize();
|
|
return bind_rot;
|
|
}
|
|
|
|
namespace FSSkinningUtil
|
|
{
|
|
void getPerVertexSkinMatrixSSE( LLVector4a const &weights, LLMatrix4a* mat, bool handle_bad_scale, LLMatrix4a& final_mat, U32 max_joints )
|
|
{
|
|
final_mat.clear();
|
|
|
|
llassert_always( !handle_bad_scale );
|
|
|
|
LL_ALIGN_16( S32 idx[4] );
|
|
LL_ALIGN_16( F32 wght[4] );
|
|
|
|
__m128i _mMaxIdx = _mm_set_epi16( max_joints-1, max_joints-1, max_joints-1, max_joints-1, max_joints-1, max_joints-1, max_joints-1, max_joints-1 );
|
|
__m128i _mIdx = _mm_cvttps_epi32( (__m128)weights );
|
|
__m128 _mWeight = _mm_sub_ps( (__m128)weights, _mm_cvtepi32_ps( _mIdx ) );
|
|
|
|
_mIdx = _mm_min_epi16( _mIdx, _mMaxIdx );
|
|
_mm_store_si128( (__m128i*)idx, _mIdx );
|
|
|
|
__m128 _mScale = _mm_add_ps( _mWeight, _mm_movehl_ps( _mWeight, _mWeight ));
|
|
_mScale = _mm_add_ss( _mScale, _mm_shuffle_ps( _mScale, _mScale, 1) );
|
|
_mScale = _mm_shuffle_ps( _mScale, _mScale, 0 );
|
|
|
|
_mWeight = _mm_div_ps( _mWeight, _mScale );
|
|
_mm_store_ps( wght, _mWeight );
|
|
|
|
for (U32 k = 0; k < 4; k++)
|
|
{
|
|
F32 w = wght[k];
|
|
|
|
LLMatrix4a src;
|
|
src.setMul(mat[idx[k]], w);
|
|
|
|
final_mat.add(src);
|
|
}
|
|
}
|
|
}
|