523 lines
15 KiB
C++
523 lines
15 KiB
C++
//========= Copyright <20> 1996-2005, Valve Corporation, All rights reserved. ============//
|
||
//
|
||
// Purpose: Defines a symbol table
|
||
//
|
||
// $Header: $
|
||
// $NoKeywords: $
|
||
//=============================================================================//
|
||
|
||
#pragma warning (disable:4514)
|
||
|
||
#include "utlsymbol.h"
|
||
#include "tier0/threadtools.h"
|
||
#include "stringpool.h"
|
||
#include "generichash.h"
|
||
#include "tier0/vprof.h"
|
||
#include <stddef.h>
|
||
|
||
// memdbgon must be the last include file in a .cpp file!!!
|
||
#include "tier0/memdbgon.h"
|
||
|
||
#define INVALID_STRING_INDEX CStringPoolIndex( 0xFFFF, 0xFFFF )
|
||
|
||
#define MIN_STRING_POOL_SIZE 2048
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// globals
|
||
//-----------------------------------------------------------------------------
|
||
|
||
CUtlSymbolTableMT* CUtlSymbol::s_pSymbolTable = 0;
|
||
bool CUtlSymbol::s_bAllowStaticSymbolTable = true;
|
||
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// symbol methods
|
||
//-----------------------------------------------------------------------------
|
||
|
||
void CUtlSymbol::Initialize()
|
||
{
|
||
// If this assert fails, then the module that this call is in has chosen to disallow
|
||
// use of the static symbol table. Usually, it's to prevent confusion because it's easy
|
||
// to accidentally use the global symbol table when you really want to use a specific one.
|
||
Assert( s_bAllowStaticSymbolTable );
|
||
|
||
// necessary to allow us to create global symbols
|
||
static bool symbolsInitialized = false;
|
||
if (!symbolsInitialized)
|
||
{
|
||
s_pSymbolTable = new CUtlSymbolTableMT;
|
||
symbolsInitialized = true;
|
||
}
|
||
}
|
||
|
||
void CUtlSymbol::LockTableForRead()
|
||
{
|
||
Initialize();
|
||
s_pSymbolTable->LockForRead();
|
||
}
|
||
|
||
void CUtlSymbol::UnlockTableForRead()
|
||
{
|
||
s_pSymbolTable->UnlockForRead();
|
||
}
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// Purpose: Singleton to delete table on exit from module
|
||
//-----------------------------------------------------------------------------
|
||
class CCleanupUtlSymbolTable
|
||
{
|
||
public:
|
||
~CCleanupUtlSymbolTable()
|
||
{
|
||
delete CUtlSymbol::s_pSymbolTable;
|
||
CUtlSymbol::s_pSymbolTable = NULL;
|
||
}
|
||
};
|
||
|
||
static CCleanupUtlSymbolTable g_CleanupSymbolTable;
|
||
|
||
CUtlSymbolTableMT* CUtlSymbol::CurrTable()
|
||
{
|
||
Initialize();
|
||
return s_pSymbolTable;
|
||
}
|
||
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// string->symbol->string
|
||
//-----------------------------------------------------------------------------
|
||
|
||
CUtlSymbol::CUtlSymbol( const char* pStr )
|
||
{
|
||
m_Id = CurrTable()->AddString( pStr );
|
||
}
|
||
|
||
const char* CUtlSymbol::String( ) const
|
||
{
|
||
return CurrTable()->String(m_Id);
|
||
}
|
||
|
||
const char* CUtlSymbol::StringNoLock( ) const
|
||
{
|
||
return CurrTable()->StringNoLock(m_Id);
|
||
}
|
||
|
||
void CUtlSymbol::DisableStaticSymbolTable()
|
||
{
|
||
s_bAllowStaticSymbolTable = false;
|
||
}
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// checks if the symbol matches a string
|
||
//-----------------------------------------------------------------------------
|
||
|
||
bool CUtlSymbol::operator==( const char* pStr ) const
|
||
{
|
||
if (m_Id == UTL_INVAL_SYMBOL)
|
||
return false;
|
||
return strcmp( String(), pStr ) == 0;
|
||
}
|
||
|
||
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// symbol table stuff
|
||
//-----------------------------------------------------------------------------
|
||
inline const char* CUtlSymbolTable::DecoratedStringFromIndex( const CStringPoolIndex &index ) const
|
||
{
|
||
Assert( index.m_iPool < m_StringPools.Count() );
|
||
Assert( index.m_iOffset < m_StringPools[index.m_iPool]->m_TotalLen );
|
||
|
||
// step over the hash decorating the beginning of the string
|
||
return (&m_StringPools[index.m_iPool]->m_Data[index.m_iOffset]);
|
||
}
|
||
|
||
inline const char* CUtlSymbolTable::StringFromIndex( const CStringPoolIndex &index ) const
|
||
{
|
||
// step over the hash decorating the beginning of the string
|
||
return DecoratedStringFromIndex(index)+sizeof(hashDecoration_t);
|
||
}
|
||
|
||
// The first two bytes of each string in the pool are actually the hash for that string.
|
||
// Thus we compare hashes rather than entire strings for a significant perf benefit.
|
||
// However since there is a high rate of hash collision we must still compare strings
|
||
// if the hashes match.
|
||
bool CUtlSymbolTable::CLess::operator()( const CStringPoolIndex &i1, const CStringPoolIndex &i2 ) const
|
||
{
|
||
// Need to do pointer math because CUtlSymbolTable is used in CUtlVectors, and hence
|
||
// can be arbitrarily moved in memory on a realloc. Yes, this is portable. In reality,
|
||
// right now at least, because m_LessFunc is the first member of CUtlRBTree, and m_Lookup
|
||
// is the first member of CUtlSymbolTabke, this == pTable
|
||
CUtlSymbolTable *pTable = (CUtlSymbolTable *)( (byte *)this - offsetof(CUtlSymbolTable::CTree, m_LessFunc) ) - offsetof(CUtlSymbolTable, m_Lookup );
|
||
|
||
#if 1 // using the hashes
|
||
const char *str1, *str2;
|
||
hashDecoration_t hash1, hash2;
|
||
|
||
if (i1 == INVALID_STRING_INDEX)
|
||
{
|
||
str1 = pTable->m_pUserSearchString;
|
||
hash1 = pTable->m_nUserSearchStringHash;
|
||
}
|
||
else
|
||
{
|
||
str1 = pTable->DecoratedStringFromIndex( i1 );
|
||
hashDecoration_t storedHash = *reinterpret_cast<const hashDecoration_t *>(str1);
|
||
str1 += sizeof(hashDecoration_t);
|
||
AssertMsg2( storedHash == ( !pTable->m_bInsensitive ? HashString(str1) : HashStringCaseless(str1) ),
|
||
"The stored hash (%d) for symbol %s is not correct.", storedHash, str1 );
|
||
hash1 = storedHash;
|
||
}
|
||
|
||
if (i2 == INVALID_STRING_INDEX)
|
||
{
|
||
str2 = pTable->m_pUserSearchString;
|
||
hash2 = pTable->m_nUserSearchStringHash;
|
||
}
|
||
else
|
||
{
|
||
str2 = pTable->DecoratedStringFromIndex( i2 );
|
||
hashDecoration_t storedHash = *reinterpret_cast<const hashDecoration_t *>(str2);
|
||
str2 += sizeof(hashDecoration_t);
|
||
AssertMsg2( storedHash == ( !pTable->m_bInsensitive ? HashString(str2) : HashStringCaseless(str2) ),
|
||
"The stored hash (%d) for symbol '%s' is not correct.", storedHash, str2 );
|
||
hash2 = storedHash;
|
||
}
|
||
|
||
// compare the hashes
|
||
if ( hash1 == hash2 )
|
||
{
|
||
if ( !str1 && str2 )
|
||
return 1;
|
||
if ( !str2 && str1 )
|
||
return -1;
|
||
if ( !str1 && !str2 )
|
||
return 0;
|
||
|
||
// if the hashes match compare the strings
|
||
if ( !pTable->m_bInsensitive )
|
||
return strcmp( str1, str2 ) < 0;
|
||
else
|
||
return V_stricmp( str1, str2 ) < 0;
|
||
}
|
||
else
|
||
{
|
||
return hash1 < hash2;
|
||
}
|
||
|
||
#else // not using the hashes, just comparing strings
|
||
const char* str1 = (i1 == INVALID_STRING_INDEX) ? pTable->m_pUserSearchString :
|
||
pTable->StringFromIndex( i1 );
|
||
const char* str2 = (i2 == INVALID_STRING_INDEX) ? pTable->m_pUserSearchString :
|
||
pTable->StringFromIndex( i2 );
|
||
|
||
if ( !str1 && str2 )
|
||
return 1;
|
||
if ( !str2 && str1 )
|
||
return -1;
|
||
if ( !str1 && !str2 )
|
||
return 0;
|
||
if ( !pTable->m_bInsensitive )
|
||
return strcmp( str1, str2 ) < 0;
|
||
else
|
||
return strcmpi( str1, str2 ) < 0;
|
||
#endif
|
||
}
|
||
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// constructor, destructor
|
||
//-----------------------------------------------------------------------------
|
||
CUtlSymbolTable::CUtlSymbolTable( int growSize, int initSize, bool caseInsensitive ) :
|
||
m_Lookup( growSize, initSize ), m_bInsensitive( caseInsensitive ), m_StringPools( 8 )
|
||
{
|
||
}
|
||
|
||
CUtlSymbolTable::~CUtlSymbolTable()
|
||
{
|
||
// Release the stringpool string data
|
||
RemoveAll();
|
||
}
|
||
|
||
|
||
CUtlSymbol CUtlSymbolTable::Find( const char* pString ) const
|
||
{
|
||
VPROF( "CUtlSymbol::Find" );
|
||
if (!pString)
|
||
return CUtlSymbol();
|
||
|
||
// Store a special context used to help with insertion
|
||
m_pUserSearchString = pString;
|
||
m_nUserSearchStringHash = m_bInsensitive ? HashStringCaseless(pString) : HashString(pString) ;
|
||
|
||
// Passing this special invalid symbol makes the comparison function
|
||
// use the string passed in the context
|
||
UtlSymId_t idx = m_Lookup.Find( INVALID_STRING_INDEX );
|
||
|
||
#ifdef _DEBUG
|
||
m_pUserSearchString = NULL;
|
||
m_nUserSearchStringHash = 0;
|
||
#endif
|
||
|
||
return CUtlSymbol( idx );
|
||
}
|
||
|
||
|
||
int CUtlSymbolTable::FindPoolWithSpace( int len ) const
|
||
{
|
||
for ( int i=0; i < m_StringPools.Count(); i++ )
|
||
{
|
||
StringPool_t *pPool = m_StringPools[i];
|
||
|
||
if ( (pPool->m_TotalLen - pPool->m_SpaceUsed) >= len )
|
||
{
|
||
return i;
|
||
}
|
||
}
|
||
|
||
return -1;
|
||
}
|
||
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// Finds and/or creates a symbol based on the string
|
||
//-----------------------------------------------------------------------------
|
||
|
||
CUtlSymbol CUtlSymbolTable::AddString( const char* pString )
|
||
{
|
||
VPROF("CUtlSymbol::AddString");
|
||
if (!pString)
|
||
return CUtlSymbol( UTL_INVAL_SYMBOL );
|
||
|
||
CUtlSymbol id = Find( pString );
|
||
|
||
if (id.IsValid())
|
||
return id;
|
||
|
||
int lenString = strlen(pString) + 1; // length of just the string
|
||
int lenDecorated = lenString + sizeof(hashDecoration_t); // and with its hash decoration
|
||
// make sure that all strings are aligned on 2-byte boundaries so the hashes will read correctly
|
||
COMPILE_TIME_ASSERT(sizeof(hashDecoration_t) == 2);
|
||
lenDecorated = (lenDecorated + 1) & (~0x01); // round up to nearest multiple of 2
|
||
|
||
// Find a pool with space for this string, or allocate a new one.
|
||
int iPool = FindPoolWithSpace( lenDecorated );
|
||
if ( iPool == -1 )
|
||
{
|
||
// Add a new pool.
|
||
int newPoolSize = MAX( lenDecorated + sizeof( StringPool_t ), MIN_STRING_POOL_SIZE );
|
||
StringPool_t *pPool = (StringPool_t*)malloc( newPoolSize );
|
||
pPool->m_TotalLen = newPoolSize - sizeof( StringPool_t );
|
||
pPool->m_SpaceUsed = 0;
|
||
iPool = m_StringPools.AddToTail( pPool );
|
||
}
|
||
|
||
// Compute a hash
|
||
hashDecoration_t hash = m_bInsensitive ? HashStringCaseless(pString) : HashString(pString) ;
|
||
|
||
// Copy the string in.
|
||
StringPool_t *pPool = m_StringPools[iPool];
|
||
Assert( pPool->m_SpaceUsed < 0xFFFF ); // This should never happen, because if we had a string > 64k, it
|
||
// would have been given its entire own pool.
|
||
|
||
unsigned short iStringOffset = pPool->m_SpaceUsed;
|
||
const char *startingAddr = &pPool->m_Data[pPool->m_SpaceUsed];
|
||
|
||
// store the hash at the head of the string
|
||
*((hashDecoration_t *)(startingAddr)) = hash;
|
||
// and then the string's data
|
||
memcpy( (void *)(startingAddr + sizeof(hashDecoration_t)), pString, lenString );
|
||
pPool->m_SpaceUsed += lenDecorated;
|
||
|
||
// insert the string into the vector.
|
||
CStringPoolIndex index;
|
||
index.m_iPool = iPool;
|
||
index.m_iOffset = iStringOffset;
|
||
|
||
MEM_ALLOC_CREDIT();
|
||
UtlSymId_t idx = m_Lookup.Insert( index );
|
||
return CUtlSymbol( idx );
|
||
}
|
||
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// Look up the string associated with a particular symbol
|
||
//-----------------------------------------------------------------------------
|
||
|
||
const char* CUtlSymbolTable::String( CUtlSymbol id ) const
|
||
{
|
||
if (!id.IsValid())
|
||
return "";
|
||
|
||
Assert( m_Lookup.IsValidIndex((UtlSymId_t)id) );
|
||
return StringFromIndex( m_Lookup[id] );
|
||
}
|
||
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// Remove all symbols in the table.
|
||
//-----------------------------------------------------------------------------
|
||
|
||
void CUtlSymbolTable::RemoveAll()
|
||
{
|
||
m_Lookup.Purge();
|
||
|
||
for ( int i=0; i < m_StringPools.Count(); i++ )
|
||
free( m_StringPools[i] );
|
||
|
||
m_StringPools.RemoveAll();
|
||
}
|
||
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// Purpose:
|
||
// Input : *pFileName -
|
||
// Output : FileNameHandle_t
|
||
//-----------------------------------------------------------------------------
|
||
FileNameHandle_t CUtlFilenameSymbolTable::FindOrAddFileName( const char *pFileName )
|
||
{
|
||
if ( !pFileName )
|
||
{
|
||
return NULL;
|
||
}
|
||
|
||
// find first
|
||
FileNameHandle_t hFileName = FindFileName( pFileName );
|
||
if ( hFileName )
|
||
{
|
||
return hFileName;
|
||
}
|
||
|
||
// Fix slashes+dotslashes and make lower case first..
|
||
char fn[ MAX_PATH ];
|
||
Q_strncpy( fn, pFileName, sizeof( fn ) );
|
||
Q_RemoveDotSlashes( fn );
|
||
#ifdef _WIN32
|
||
strlwr( fn );
|
||
#endif
|
||
|
||
// Split the filename into constituent parts
|
||
char basepath[ MAX_PATH ];
|
||
Q_ExtractFilePath( fn, basepath, sizeof( basepath ) );
|
||
char filename[ MAX_PATH ];
|
||
Q_strncpy( filename, fn + Q_strlen( basepath ), sizeof( filename ) );
|
||
|
||
// not found, lock and look again
|
||
FileNameHandleInternal_t handle;
|
||
m_lock.LockForWrite();
|
||
handle.SetPath( m_PathStringPool.FindStringHandle( basepath ) );
|
||
handle.SetFile( m_FileStringPool.FindStringHandle( filename ) );
|
||
if ( handle.GetPath() && handle.GetFile() )
|
||
{
|
||
// found
|
||
m_lock.UnlockWrite();
|
||
return *( FileNameHandle_t * )( &handle );
|
||
}
|
||
|
||
// safely add it
|
||
handle.SetPath( m_PathStringPool.ReferenceStringHandle( basepath ) );
|
||
handle.SetFile( m_FileStringPool.ReferenceStringHandle( filename ) );
|
||
m_lock.UnlockWrite();
|
||
|
||
return *( FileNameHandle_t * )( &handle );
|
||
}
|
||
|
||
FileNameHandle_t CUtlFilenameSymbolTable::FindFileName( const char *pFileName )
|
||
{
|
||
if ( !pFileName )
|
||
{
|
||
return NULL;
|
||
}
|
||
|
||
// Fix slashes+dotslashes and make lower case first..
|
||
char fn[ MAX_PATH ];
|
||
Q_strncpy( fn, pFileName, sizeof( fn ) );
|
||
Q_RemoveDotSlashes( fn );
|
||
#ifdef _WIN32
|
||
strlwr( fn );
|
||
#endif
|
||
|
||
// Split the filename into constituent parts
|
||
char basepath[ MAX_PATH ];
|
||
Q_ExtractFilePath( fn, basepath, sizeof( basepath ) );
|
||
char filename[ MAX_PATH ];
|
||
Q_strncpy( filename, fn + Q_strlen( basepath ), sizeof( filename ) );
|
||
|
||
FileNameHandleInternal_t handle;
|
||
|
||
m_lock.LockForRead();
|
||
handle.SetPath( m_PathStringPool.FindStringHandle( basepath ) );
|
||
handle.SetFile( m_FileStringPool.FindStringHandle( filename ) );
|
||
m_lock.UnlockRead();
|
||
|
||
|
||
if ( ( handle.GetPath() == 0 ) || ( handle.GetFile() == 0 ) )
|
||
return NULL;
|
||
|
||
return *( FileNameHandle_t * )( &handle );
|
||
}
|
||
|
||
//-----------------------------------------------------------------------------
|
||
// Purpose:
|
||
// Input : handle -
|
||
// Output : const char
|
||
//-----------------------------------------------------------------------------
|
||
bool CUtlFilenameSymbolTable::String( const FileNameHandle_t& handle, char *buf, int buflen )
|
||
{
|
||
buf[ 0 ] = 0;
|
||
|
||
FileNameHandleInternal_t *internalFileHandle = ( FileNameHandleInternal_t * )&handle;
|
||
if ( !internalFileHandle )
|
||
{
|
||
return false;
|
||
}
|
||
|
||
m_lock.LockForRead();
|
||
const char *path = m_PathStringPool.HandleToString( internalFileHandle->GetPath() );
|
||
const char *fn = m_FileStringPool.HandleToString( internalFileHandle->GetFile() );
|
||
m_lock.UnlockRead();
|
||
|
||
if ( !path || !fn )
|
||
{
|
||
return false;
|
||
}
|
||
|
||
Q_strncpy( buf, path, buflen );
|
||
Q_strncat( buf, fn, buflen, COPY_ALL_CHARACTERS );
|
||
|
||
return true;
|
||
}
|
||
|
||
void CUtlFilenameSymbolTable::RemoveAll()
|
||
{
|
||
m_PathStringPool.FreeAll();
|
||
m_FileStringPool.FreeAll();
|
||
}
|
||
|
||
void CUtlFilenameSymbolTable::SpewStrings()
|
||
{
|
||
m_lock.LockForRead();
|
||
m_PathStringPool.SpewStrings();
|
||
m_FileStringPool.SpewStrings();
|
||
m_lock.UnlockRead();
|
||
}
|
||
|
||
bool CUtlFilenameSymbolTable::SaveToBuffer( CUtlBuffer &buffer )
|
||
{
|
||
m_lock.LockForRead();
|
||
bool bResult = m_PathStringPool.SaveToBuffer( buffer );
|
||
bResult = bResult && m_FileStringPool.SaveToBuffer( buffer );
|
||
m_lock.UnlockRead();
|
||
|
||
return bResult;
|
||
}
|
||
|
||
bool CUtlFilenameSymbolTable::RestoreFromBuffer( CUtlBuffer &buffer )
|
||
{
|
||
m_lock.LockForWrite();
|
||
bool bResult = m_PathStringPool.RestoreFromBuffer( buffer );
|
||
bResult = bResult && m_FileStringPool.RestoreFromBuffer( buffer );
|
||
m_lock.UnlockWrite();
|
||
|
||
return bResult;
|
||
}
|