tripwire-open-source/src/core/stringutil.cpp

347 lines
9.4 KiB
C++

//
// The developer of the original code and/or files is Tripwire, Inc.
// Portions created by Tripwire, Inc. are copyright (C) 2000-2019 Tripwire,
// Inc. Tripwire is a registered trademark of Tripwire, Inc. All rights
// reserved.
//
// This program is free software. The contents of this file are subject
// to the terms of the GNU General Public License as published by the
// Free Software Foundation; either version 2 of the License, or (at your
// option) any later version. You may redistribute it and/or modify it
// only in compliance with the GNU General Public License.
//
// This program is distributed in the hope that it will be useful.
// However, this program is distributed AS-IS WITHOUT ANY
// WARRANTY; INCLUDING THE IMPLIED WARRANTY OF MERCHANTABILITY OR FITNESS
// FOR A PARTICULAR PURPOSE. Please see the GNU General Public License
// for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307,
// USA.
//
// Nothing in the GNU General Public License or any other license to use
// the code or files shall permit you to use Tripwire's trademarks,
// service marks, or other intellectual property without Tripwire's
// prior written consent.
//
// If you have any questions, please contact Tripwire, Inc. at either
// info@tripwire.org or www.tripwire.org.
//
/*
* Name....: stringutil.cpp
* Date....: 09/02/99
* Creator.:
*
* This module implements the cStringUtil class and helpers. This class,
* primarily, is used to convert between various character formats. The
* supported formats include:
*
* NTWCS - using 32-bit wchar_t
* NTWCS - using 16-bit wchar_t
* NTMBS - using integral char's
*
* PLEASE NOTE:
* Refrain from using the StrToTStr, TStrToStr, WStrToTStr, and
* etc calls and instead use the type dispatched member:
*
* DestT::const_iterator Convert( DestT&, const SrcT& );
*
* It can be used like so:
*
* TSTRING tstr;
* TCOUT << cStringUtil::Convert( tstr, sUnknownType );
*
* This call makes our code more portable and extensible by not embedding
* type selection in the names of interfaces. For example:
*
* std::string s1 = cStringUtil::TStrToStr( TSTRING( "Huh" ) );
*
* Can be rewritten as:
*
* std::string s1;
* cStringUtil::Convert( s1, TSTRING( "Huh" ) );
*/
/// Requirements
#include "stdcore.h" // for: pch
#include "stringutil.h" // for: These Declarations
#include "debug.h" // for: Debugging Interface
#include "codeconvert.h" // for: iconv abstractions
#include "ntmbs.h" // for: eCharacterEncoding
#include "hashtable.h"
//- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
// String Cache
//- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
// TODO:BAM -- use these for mb -> UCS2 conversions as well?
class tss_hash_key_convert
{
public:
const uint8_t* operator()(const wc16_string& s, int* const pcbKeyLen)
{
*pcbKeyLen = sizeof(WCHAR16) * s.length();
return (uint8_t*)s.c_str();
}
};
class tss_hash_key_compare
{
public:
bool operator()(const wc16_string& lhs, const wc16_string& rhs)
{
return (lhs.compare(rhs) == 0);
}
};
namespace /* Module Local */
{
typedef cHashTable<wc16_string, TSTRING, tss_hash_key_compare, tss_hash_key_convert> hashtable_t;
hashtable_t& tss_GetHashTable()
{
static hashtable_t s_table;
return s_table;
}
} // namespace
inline void tss_insert_in_hash(const wc16_string& lhs, const TSTRING& rhs)
{
tss_GetHashTable().Insert(lhs, rhs);
}
inline bool tss_find_in_hash(const wc16_string& lhs, TSTRING& rhs)
{
return (tss_GetHashTable().Lookup(lhs, rhs));
}
//- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
// Type Dispatched Conversions
//- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
/*static*/
std::string::const_iterator cStringUtil::Convert(std::string& nbs, const wc16_string& dbs)
{
#if IS_AROS
nbs.resize(dbs.length());
for (int x = 0; x < dbs.length(); ++x)
nbs[x] = (unsigned char)dbs[x];
#else
cDebug d("cStringUtil::Convert( char, w16 )");
ASSERT((void*)nbs.c_str() != (void*)dbs.c_str());
if (dbs.empty())
nbs.erase();
else
{
if (tss_find_in_hash(dbs, nbs))
{
d.TraceNever(_T("found string in hash table\n"));
return nbs.begin();
}
else
{
d.TraceNever(_T("didn't find string in hash table\n"));
}
/*
d.TraceDebug( _T("converting: \n") );
for( int i = 0; i < dbs.size(); i++ )
d.TraceDebug( _T("0x%04X\n"), dbs[i] );
d.TraceDebug( _T("----\n") );
*/
nbs.resize(dbs.size() * MB_CUR_MAX);
int nWrote = iCodeConverter::GetInstance()->Convert(
(char*)nbs.c_str(), nbs.size(), dbs.c_str(), dbs.size()); // c_str() because must be null terminated
d.TraceDetail(_T("iCodeConverter returned %d\n"), nWrote);
if (nWrote == -1)
throw eCharacterEncoding(TSS_GetString(cCore, core::STR_ERR_BADCHAR));
nbs.resize(nWrote);
tss_insert_in_hash(dbs, nbs);
}
#endif
return nbs.begin();
}
/*static*/
wc16_string::const_iterator cStringUtil::Convert(wc16_string& dbs, const std::string& nbs)
{
#if IS_AROS
dbs.resize(nbs.length());
for (int x = 0; x < nbs.length(); x++)
dbs[x] = (unsigned short)nbs[x];
#else
cDebug d("cStringUtil::Convert( w16, char )");
if (nbs.size() != 0)
{
dbs.resize(nbs.size());
// d.TraceDebug( "converting <%s>\n", nbs.c_str() );
int nWrote = iCodeConverter::GetInstance()->Convert(
(WCHAR16*)dbs.c_str(), dbs.length(), nbs.c_str(), nbs.size()); // c_str() because must be null terminated
d.TraceDetail(_T("iCodeConverter returned %d\n"), nWrote);
if (nWrote == -1)
{
throw eCharacterEncoding(TSS_GetString(cCore, core::STR_ERR_BADCHAR));
}
dbs.resize(nWrote);
/*
d.TraceDebug( _T("converted to: \n") );
for( int i = 0; i < dbs.size(); i++ )
d.TraceDebug( _T("0x%04X\n"), dbs[i] );
d.TraceDebug( _T("----\n") );
*/
}
else
dbs.resize(0);
#endif
return dbs.begin();
}
#if SUPPORTS_WCHART && WCHAR_REP_IS_UCS2
/*static*/
std::wstring::const_iterator cStringUtil::Convert(std::wstring& wcs, const wc16_string& dbs)
{
if (dbs.size() != 0)
{
if (tss_find_in_hash(dbs, wcs))
return wcs.begin();
wcs.resize(dbs.size());
std::copy(dbs.begin(), dbs.end(), wcs.begin());
tss_insert_in_hash(dbs, wcs);
}
else
wcs.erase();
return wcs.begin();
}
/*static*/
wc16_string::const_iterator cStringUtil::Convert(wc16_string& dbs, const std::wstring& wcs)
{
if (wcs.size() != 0)
{
dbs.resize(wcs.size());
std::copy(wcs.begin(), wcs.end(), dbs.begin());
}
else
dbs.resize(0);
return dbs.begin();
}
/*static*/
std::wstring::const_iterator cStringUtil::Convert(std::wstring& wcs, const std::string& nbs)
{
if (nbs.size() != 0)
{
wcs.resize(nbs.size());
size_t nWrote = ::mbstowcs((wchar_t*)wcs.c_str(), nbs.c_str(), wcs.size() + 1);
if (nWrote == (size_t)-1)
throw eCharacterEncoding(TSS_GetString(cCore, core::STR_ERR_BADCHAR));
wcs.resize(nWrote);
}
else
wcs.erase();
return wcs.begin();
}
/*static*/
std::string::const_iterator cStringUtil::Convert(std::string& nbs, const std::wstring& wcs)
{
if (wcs.size() != 0)
{
if (tss_find_in_hash(wc16_string(wcs.c_str()), nbs))
return nbs.begin();
nbs.resize(MB_CUR_MAX * wcs.size());
size_t nWrote = ::wcstombs((char*)nbs.c_str(), wcs.c_str(), nbs.size() + 1);
if (nWrote == (size_t)-1)
throw eCharacterEncoding(TSS_GetString(cCore, core::STR_ERR_BADCHAR));
nbs.resize(nWrote);
tss_insert_in_hash(wc16_string(wcs.c_str()), nbs);
}
else
nbs.erase();
return nbs.begin();
}
#endif // SUPPORTS_WCHART && WCHAR_REP_IS_UCS2
/// TSTRING and Type Knowledge Required
///////////////////////////////////////////////////////////////////////////////
// TstrToStr
///////////////////////////////////////////////////////////////////////////////
std::string cStringUtil::TstrToStr(const TSTRING& tstr)
{
std::string s;
cStringUtil::Convert(s, tstr);
return s;
}
///////////////////////////////////////////////////////////////////////////////
// StrToTstr
///////////////////////////////////////////////////////////////////////////////
TSTRING cStringUtil::StrToTstr(const std::string& rhs)
{
TSTRING lhs;
cStringUtil::Convert(lhs, rhs);
return lhs;
}
///////////////////////////////////////////////////////////////////////////////
// WstrToTstr
///////////////////////////////////////////////////////////////////////////////
TSTRING cStringUtil::WstrToTstr(const wc16_string& rhs)
{
TSTRING lhs;
cStringUtil::Convert(lhs, rhs);
return lhs;
}
///////////////////////////////////////////////////////////////////////////////
// TstrToWstr
///////////////////////////////////////////////////////////////////////////////
wc16_string cStringUtil::TstrToWstr(const TSTRING& rhs)
{
wc16_string lhs;
cStringUtil::Convert(lhs, rhs);
return lhs;
}