css_enhanced_waf/particles/particle_sort.cpp
FluorescentCIAAfricanAmerican 3bf9df6b27 1
2020-04-22 12:56:21 -04:00

194 lines
5.5 KiB
C++

//========= Copyright Valve Corporation, All rights reserved. ============//
//
// Purpose: particle system code
//
//===========================================================================//
#include <algorithm>
#include "tier0/platform.h"
#include "tier0/vprof.h"
#include "particles/particles.h"
#include "psheet.h"
// memdbgon must be the last include file in a .cpp file!!!
#include "tier0/memdbgon.h"
static ALIGN16 ParticleRenderData_t s_SortedIndexList[MAX_PARTICLES_IN_A_SYSTEM] ALIGN16_POST;
enum EParticleSortKeyType
{
SORT_KEY_NONE,
SORT_KEY_DISTANCE,
SORT_KEY_CREATION_TIME,
};
template<EParticleSortKeyType eSortKeyMode> void s_GenerateData( Vector CameraPos, CParticleVisibilityData *pVisibilityData, CParticleCollection *pParticles )
{
fltx4 *pOutUnSorted = reinterpret_cast<fltx4 *>( s_SortedIndexList );
C4VAttributeIterator pXYZ( PARTICLE_ATTRIBUTE_XYZ, pParticles );
CM128AttributeIterator pCreationTimeStamp( PARTICLE_ATTRIBUTE_CREATION_TIME, pParticles );
CM128AttributeIterator pAlpha( PARTICLE_ATTRIBUTE_ALPHA, pParticles );
CM128AttributeIterator pAlpha2( PARTICLE_ATTRIBUTE_ALPHA2, pParticles );
CM128AttributeIterator pRadius( PARTICLE_ATTRIBUTE_RADIUS, pParticles );
int nParticles = pParticles->m_nActiveParticles;
FourVectors EyePos;
EyePos.DuplicateVector( CameraPos );
fltx4 fl4AlphaVis = ReplicateX4( pVisibilityData->m_flAlphaVisibility );
fltx4 fl4RadVis = ReplicateX4( pVisibilityData->m_flRadiusVisibility );
// indexing. We will generate the index as float and use magicf2i to convert to integer
fltx4 fl4OutIdx = g_SIMD_0123; // 0 1 2 3
fl4OutIdx = AddSIMD( fl4OutIdx, Four_2ToThe23s); // fix as int
bool bUseVis = pVisibilityData->m_bUseVisibility;
bool bCameraBias = pVisibilityData->m_flCameraBias != 0.0f;
fltx4 fl4Bias = ReplicateX4( pVisibilityData->m_flCameraBias );
fltx4 fl4AlphaScale = ReplicateX4( 255.0 );
do
{
fltx4 fl4X = pXYZ->x;
fltx4 fl4Y = pXYZ->y;
fltx4 fl4Z = pXYZ->z;
fltx4 fl4SortKey;
if ( eSortKeyMode == SORT_KEY_DISTANCE )
{
fltx4 Xdiff = SubSIMD( EyePos.x, fl4X );
fltx4 Ydiff = SubSIMD( EyePos.y, fl4Y );
fltx4 Zdiff = SubSIMD( EyePos.z, fl4Z );
if ( bCameraBias )
{
FourVectors v4CameraBias;
v4CameraBias.x = Xdiff;
v4CameraBias.y = Ydiff;
v4CameraBias.z = Zdiff;
//v4CameraBias = VectorNormalizeFast( v4CameraBias );
v4CameraBias.VectorNormalizeFast();
v4CameraBias *= fl4Bias;
fl4X = SubSIMD( fl4X, v4CameraBias.x );
fl4Y = SubSIMD( fl4Y, v4CameraBias.y );
fl4Z = SubSIMD( fl4Z, v4CameraBias.z );
Xdiff = SubSIMD( EyePos.x, fl4X );
Ydiff = SubSIMD( EyePos.y, fl4Y );
Zdiff = SubSIMD( EyePos.z, fl4Z );
}
fl4SortKey = AddSIMD( MulSIMD( Xdiff, Xdiff ),
AddSIMD( MulSIMD( Ydiff, Ydiff ),
MulSIMD( Zdiff, Zdiff ) ) );
}
else
{
Assert ( eSortKeyMode == SORT_KEY_CREATION_TIME || eSortKeyMode == SORT_KEY_NONE );
fl4SortKey = *pCreationTimeStamp;
}
fltx4 fl4FinalAlpha = MulSIMD( *pAlpha, *pAlpha2 );
fltx4 fl4FinalRadius = *pRadius;
if ( bUseVis )
{
fl4FinalAlpha = MaxSIMD ( Four_Zeros, MinSIMD( Four_Ones, MulSIMD( fl4FinalAlpha, fl4AlphaVis) ) );
fl4FinalRadius = MulSIMD( fl4FinalRadius, fl4RadVis );
}
// convert float 0..1 to int 0..255
fl4FinalAlpha = AddSIMD( MulSIMD( fl4FinalAlpha, fl4AlphaScale ), Four_2ToThe23s );
// now, we will use simd transpose to write the output
fltx4 i4Indices = AndSIMD( fl4OutIdx, LoadAlignedSIMD( (float *) g_SIMD_Low16BitsMask ) );
TransposeSIMD( fl4SortKey, i4Indices, fl4FinalRadius, fl4FinalAlpha );
pOutUnSorted[0] = fl4SortKey;
pOutUnSorted[1] = i4Indices;
pOutUnSorted[2] = fl4FinalRadius;
pOutUnSorted[3] = fl4FinalAlpha;
pOutUnSorted += 4;
fl4OutIdx = AddSIMD( fl4OutIdx, Four_Fours );
nParticles -= 4;
++pXYZ;
++pAlpha;
++pAlpha2;
++pRadius;
} while( nParticles > 0 ); // we're not called with 0
}
#define TREATASINT(x) ( *( ( (int32 const *)( &(x) ) ) ) )
static bool SortLessFunc( const ParticleRenderData_t &left, const ParticleRenderData_t &right )
{
return TREATASINT( left.m_flSortKey ) < TREATASINT( right.m_flSortKey );
}
void CParticleCollection::GenerateSortedIndexList( Vector vecCamera, CParticleVisibilityData *pVisibilityData, bool bSorted )
{
VPROF_BUDGET( "CParticleCollection::GenerateSortedIndexList", VPROF_BUDGETGROUP_PARTICLE_RENDERING );
if ( bSorted )
{
s_GenerateData<SORT_KEY_DISTANCE>( vecCamera, pVisibilityData, this );
}
else
s_GenerateData<SORT_KEY_NONE>( vecCamera, pVisibilityData, this );
// check data
#if 0
bool bBad = false;
for( int i = 0; i < m_nActiveParticles; i++ )
{
Assert( s_SortedIndexList[i].m_nIndex == i );
if ( s_SortedIndexList[i].m_nIndex != i )
bBad = true;
}
if ( bBad )
{
s_GenerateData<SORT_KEY_NONE>( vecCamera, pVisibilityData, this );
}
#endif
#ifndef SWDS
if ( bSorted )
{
// sort the output in place
std::make_heap( s_SortedIndexList, s_SortedIndexList + m_nActiveParticles, SortLessFunc );
std::sort_heap( s_SortedIndexList, s_SortedIndexList + m_nActiveParticles, SortLessFunc );
}
#endif
}
const ParticleRenderData_t *CParticleCollection::GetRenderList( IMatRenderContext *pRenderContext, bool bSorted, int *pNparticles, CParticleVisibilityData *pVisibilityData)
{
if ( bSorted )
bSorted = m_pDef->m_bShouldSort;
Vector vecCamera;
pRenderContext->GetWorldSpaceCameraPosition( &vecCamera );
*pNparticles = m_nActiveParticles;
GenerateSortedIndexList( vecCamera, pVisibilityData, bSorted );
return s_SortedIndexList+m_nActiveParticles;
}