Solution to the wxMBConv issue: add separate XX2XX overloads for strings of a specified length, and use them in wxString instead of the previous worst-case buffer sizing

git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@30186 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775
This commit is contained in:
Ryan Norton 2004-10-30 20:16:25 +00:00
parent 9026d6fd7f
commit e4e3bbb447
4 changed files with 157 additions and 147 deletions

View File

@ -41,11 +41,18 @@ class WXDLLIMPEXP_BASE wxMBConv
public: public:
// the actual conversion takes place here // the actual conversion takes place here
// //
// note that n is the size of the output buffer, not the length of input // note that outputSize is the size of the output buffer, not the length of input
// (the latter is always supposed to be NUL-terminated) // (the latter is always supposed to be NUL-terminated)
virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const = 0; virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const = 0;
virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const = 0; virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const = 0;
// actual conversion for strings with embedded null characters
//
// outputSize is the size of the output buffer
// pszLen is the length of the input string: embedded null characters are counted, the final terminating null is not
size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize, size_t pszLen) const;
size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize, size_t pszLen) const;
// MB <-> WC // MB <-> WC
const wxWCharBuffer cMB2WC(const char *psz) const; const wxWCharBuffer cMB2WC(const char *psz) const;
const wxCharBuffer cWC2MB(const wchar_t *psz) const; const wxCharBuffer cWC2MB(const wchar_t *psz) const;

View File

@ -1077,9 +1077,6 @@ public:
// the same as above, but takes a va_list // the same as above, but takes a va_list
static wxString FormatV(const wxChar *pszFormat, va_list argptr); static wxString FormatV(const wxChar *pszFormat, va_list argptr);
// returns the highest possible memory allocation for encoding
static size_t WorstEncodingCase(size_t len, const wxMBConv& conv);
// raw access to string memory // raw access to string memory
// ensure that string has space for at least nLen characters // ensure that string has space for at least nLen characters
// only works if the data of this string is not shared // only works if the data of this string is not shared

View File

@ -217,6 +217,94 @@ const wxCharBuffer wxMBConv::cWC2MB(const wchar_t *pwz) const
return buf; return buf;
} }
// Converts a multi-byte string of explicit length, which may contain embedded
// null characters, to wide characters.
//
// The input is treated as a sequence of null-terminated substrings; each one
// is measured and converted with the 3-argument MB2WC().
//
// szBuffer   - output buffer, or NULL to only compute the resulting length
// szString   - input string; a null is expected at szString[nStringLen]
// outsize    - size of szBuffer; a substring is only written while the
//              running total (including one null per substring) fits in it
// nStringLen - length of the input, not counting the final null
//
// Returns the total converted length, not counting the final null, or
// (size_t)-1 if any substring cannot be converted.
size_t wxMBConv::MB2WC(wchar_t* szBuffer, const char* szString,
                       size_t outsize, size_t nStringLen) const
{
    const char* const szEnd = szString + nStringLen + 1;
    const char* szPos = szString;

    size_t nActualLength = 0;

    //Walk the input one null-terminated (sub)string at a time. Using '<'
    //rather than '!=' guarantees termination even if a substring runs past
    //the stated length.
    while ( szPos < szEnd )
    {
        //Get the length of the current (sub)string
        const size_t nLen = MB2WC(NULL, szPos, 0);

        //Invalid conversion?
        if ( nLen == (size_t)-1 )
            return nLen;

        //The output position is the amount of output produced so far. It is
        //NOT the input offset: the two differ as soon as a multi-byte
        //sequence collapses into a single wide character.
        const size_t nOutPos = nActualLength;

        //Increase the actual length (+1 for current null character)
        nActualLength += nLen + 1;

        //Only copy data in if buffer size is big enough
        if ( szBuffer != NULL && nActualLength <= outsize )
        {
            //Convert the current (sub)string
            if ( MB2WC(&szBuffer[nOutPos], szPos, nLen + 1) == (size_t)-1 )
                return (size_t)-1;
        }

        //Increment to next (sub)string
        //Note that we have to use strlen here instead of nLen
        //because XX2XX gives us the size of the output buffer,
        //not necessarily the length of the input string
        szPos += strlen(szPos) + 1;
    }

    //something is _really_ screwed up if the last substring did not end
    //exactly at the stated length
    wxASSERT(szPos == szEnd);

    return nActualLength - 1; //success - return actual length
}
// Converts a wide character string of explicit length, which may contain
// embedded null characters, to a multi-byte string.
//
// The input is treated as a sequence of null-terminated substrings; each one
// is measured and converted with the 3-argument WC2MB().
//
// szBuffer   - output buffer, or NULL to only compute the resulting length
// szString   - input string; a null is expected at szString[nStringLen]
// outsize    - size of szBuffer; a substring is only written while the
//              running total (including one null per substring) fits in it
// nStringLen - length of the input, not counting the final null
//
// Returns the total converted length, not counting the final null, or
// (size_t)-1 if any substring cannot be converted.
size_t wxMBConv::WC2MB(char* szBuffer, const wchar_t* szString,
                       size_t outsize, size_t nStringLen) const
{
    const wchar_t* const szEnd = szString + nStringLen + 1;
    const wchar_t* szPos = szString;

    size_t nActualLength = 0;

    //Walk the input one null-terminated (sub)string at a time. Using '<'
    //rather than '!=' guarantees termination even if a substring runs past
    //the stated length.
    while ( szPos < szEnd )
    {
        //Get the length of the current (sub)string
        const size_t nLen = WC2MB(NULL, szPos, 0);

        //Invalid conversion?
        if ( nLen == (size_t)-1 )
            return nLen;

        //The output position is the amount of output produced so far. It is
        //NOT the input offset: one wide character may expand to several
        //bytes, and using the input offset would make later substrings
        //overwrite the tail of earlier ones.
        const size_t nOutPos = nActualLength;

        //Increase the actual length (+1 for current null character)
        nActualLength += nLen + 1;

        //Only copy data in if buffer size is big enough
        if ( szBuffer != NULL && nActualLength <= outsize )
        {
            //Convert the current (sub)string
            if ( WC2MB(&szBuffer[nOutPos], szPos, nLen + 1) == (size_t)-1 )
                return (size_t)-1;
        }

        //Increment to next (sub)string
        //Note that we have to use wxWcslen here instead of nLen
        //because XX2XX gives us the size of the output buffer,
        //not necessarily the length of the input string
        szPos += wxWcslen(szPos) + 1;
    }

    //something is _really_ screwed up if the last substring did not end
    //exactly at the stated length
    wxASSERT(szPos == szEnd);

    return nActualLength - 1; //success - return actual length
}
// ---------------------------------------------------------------------------- // ----------------------------------------------------------------------------
// wxMBConvLibc // wxMBConvLibc
// ---------------------------------------------------------------------------- // ----------------------------------------------------------------------------
@ -2080,7 +2168,7 @@ public:
if (szOut == NULL) if (szOut == NULL)
{ {
// worst case // worst case
nRealOutSize = wxString::WorstEncodingCase(nBufSize - 1, *this)+1 ; nRealOutSize = ((nBufSize - 1) * 8) +1 ;
szBuffer = new char[ nRealOutSize ] ; szBuffer = new char[ nRealOutSize ] ;
} }
else else
@ -2257,7 +2345,7 @@ public:
if (buf == NULL) if (buf == NULL)
{ {
// worst case // worst case
n = wxString::WorstEncodingCase(byteInLen / SIZEOF_WCHAR_T, *this) + SIZEOF_WCHAR_T; n = ((byteInLen / SIZEOF_WCHAR_T) * 8) + SIZEOF_WCHAR_T;
tbuf = (char*) malloc( n ) ; tbuf = (char*) malloc( n ) ;
} }

View File

@ -984,126 +984,6 @@ int STRINGCLASS::compare(size_t nStart, size_t nLen,
// wxString class core // wxString class core
// =========================================================================== // ===========================================================================
// ---------------------------------------------------------------------------
// common conversion routines
// ---------------------------------------------------------------------------
// Returns an upper bound used to size encoding buffers: five times len.
// The converter argument is ignored; the factor of 5 is the figure the
// original author gives as the worst case for UTF7.
size_t wxString::WorstEncodingCase(size_t len, const wxMBConv& WXUNUSED(conv))
{
    const size_t nWorstPerChar = 5;
    return nWorstPerChar * len;
}
#if wxUSE_WCHAR_T
//Convert a wide character string of a specified length
//to a multi-byte character string, ignoring intermittent null characters.
//
// szBuffer   - output buffer, written unconditionally (must not be NULL)
// szString   - input string; a null is expected at szString[nStringLen]
// nStringLen - length of the input, not counting the final null
// conv       - converter whose 3-argument WC2MB() does the actual work
//
//Returns the actual length of the converted string (not counting the final
//null). On a conversion error the buffer is set to an empty string and 0 is
//returned.
inline size_t wxMbstr(char* szBuffer, const wchar_t* szString,
                      size_t nStringLen, wxMBConv& conv)
{
    const wchar_t* const szEnd = szString + nStringLen + 1;
    const wchar_t* szPos = szString;

    size_t nActualLength = 0;

    //Walk the input one null-terminated (sub)string at a time. Using '<'
    //rather than '!=' guarantees termination even if a substring runs past
    //the stated length.
    while ( szPos < szEnd )
    {
        //Get the length of the current (sub)string
        const size_t nLen = conv.WC2MB(NULL, szPos, 0);

        //Invalid conversion?
        if ( nLen == (size_t)-1 )
        {
            szBuffer[0] = '\0';
            return 0;
        }

        //The output position is the amount of output produced so far, not
        //the input offset: one wide character may expand to several bytes.
        const size_t nOutPos = nActualLength;

        //Increase the actual length (+1 for current null character)
        nActualLength += nLen + 1;

        //If this is true it means buffer overflow
        wxASSERT( nActualLength <= wxString::WorstEncodingCase(nStringLen, conv) + 1 );

        //Convert the current (sub)string
        if ( conv.WC2MB(&szBuffer[nOutPos], szPos, nLen + 1) == (size_t)-1 )
        {
            //error - return empty buffer
            wxFAIL_MSG(wxT("Error converting wide-character string to a multi-byte string"));
            szBuffer[0] = '\0';
            return 0;
        }

        //Increment to next (sub)string
        //Note that we have to use wxWcslen here instead of nLen
        //because XX2XX gives us the size of the output buffer,
        //not necessarily the length of the input string
        szPos += wxWcslen(szPos) + 1;
    }

    //something is _really_ screwed up if the last substring did not end
    //exactly at the stated length
    wxASSERT(szPos == szEnd);

    return nActualLength - 1; //success - return actual length
}
//Convert a multi-byte character string of a specified length
//to a wide character string, ignoring intermittent null characters.
//
// szBuffer   - output buffer, written unconditionally (must not be NULL)
// szString   - input string; a null is expected at szString[nStringLen]
// nStringLen - length of the input, not counting the final null
// conv       - converter whose 3-argument MB2WC() does the actual work
//
//Returns the actual length of the converted string (not counting the final
//null). On a conversion error the buffer is set to an empty string and 0 is
//returned.
inline size_t wxWcstr( wchar_t* szBuffer, const char* szString,
                       size_t nStringLen, wxMBConv& conv)
{
    const char* const szEnd = szString + nStringLen + 1;
    const char* szPos = szString;

    size_t nActualLength = 0;

    //Walk the input one null-terminated (sub)string at a time. Using '<'
    //rather than '!=' guarantees termination even if a substring runs past
    //the stated length.
    while ( szPos < szEnd )
    {
        //Get the length of the current (sub)string
        const size_t nLen = conv.MB2WC(NULL, szPos, 0);

        //Invalid conversion?
        if ( nLen == (size_t)-1 )
        {
            szBuffer[0] = '\0';
            return 0;
        }

        //The output position is the amount of output produced so far, not
        //the input offset: a multi-byte sequence may collapse into a single
        //wide character, which would otherwise leave gaps in the output.
        const size_t nOutPos = nActualLength;

        //Increase the actual length (+1 for current null character)
        nActualLength += nLen + 1;

        //If this is true it means buffer overflow
        wxASSERT(nActualLength <= nStringLen + 1);

        //Convert the current (sub)string
        if ( conv.MB2WC(&szBuffer[nOutPos], szPos, nLen + 1) == (size_t)-1 )
        {
            //error - return empty buffer
            wxFAIL_MSG(wxT("Error converting multi-byte string to a wide-character string"));
            szBuffer[0] = '\0';
            return 0;
        }

        //Increment to next (sub)string
        //Note that we have to use strlen here instead of nLen
        //because XX2XX gives us the size of the output buffer,
        //not necessarily the length of the input string
        szPos += strlen(szPos) + 1;
    }

    //something is _really_ screwed up if the last substring did not end
    //exactly at the stated length
    wxASSERT(szPos == szEnd);

    return nActualLength - 1; //success - return actual length
}
#endif //wxUSE_WCHAR_T
// --------------------------------------------------------------------------- // ---------------------------------------------------------------------------
// construction and conversion // construction and conversion
// --------------------------------------------------------------------------- // ---------------------------------------------------------------------------
@ -1143,28 +1023,48 @@ wxString::wxString(const char *psz, wxMBConv& conv, size_t nLength)
nLen = 0; nLen = 0;
} }
// anything to do? // anything to do?
if ( (nLen != 0) && (nLen != (size_t)-1) ) if ( (nLen != 0) && (nLen != (size_t)-1) )
{ {
//When converting mb->wc it never inflates to more characters than the length //Get length of converted string
wxStringBufferLength internalBuffer(*this, nLen + 1); size_t dwConvLen = conv.MB2WC(NULL, psz, 0, nLen);
//Do the actual conversion & Set the length of the buffer //if valid, do the conversion
internalBuffer.SetLength( if (dwConvLen != (size_t) -1)
wxWcstr(internalBuffer, psz, nLen, conv) {
); //Get internal buffer
wxStringBufferLength internalBuffer(*this, dwConvLen + 1);
//Do the actual conversion & Set the length of the buffer
internalBuffer.SetLength(
conv.MB2WC(internalBuffer, psz, dwConvLen + 1, nLen)
);
}
} }
} }
//Convert wxString in Unicode mode to a multi-byte string //Convert wxString in Unicode mode to a multi-byte string
const wxCharBuffer wxString::mb_str(wxMBConv& conv) const const wxCharBuffer wxString::mb_str(wxMBConv& conv) const
{ {
//Create the buffer //Get length of converted string
wxCharBuffer buffer( wxString::WorstEncodingCase(length(), conv) + 1); size_t dwConvLen = conv.WC2MB(NULL, (*this).c_str(), 0, length());
//Do the actual conversion (will return a blank string on error) //if valid, do the conversion
wxMbstr(buffer.data(), (*this).c_str(), length(), conv); if (dwConvLen != (size_t) -1)
{
//Create good buffer
wxCharBuffer buffer(dwConvLen + 1);
//Do the actual conversion
conv.WC2MB(buffer.data(), (*this).c_str(), dwConvLen + 1, length());
return buffer;
}
//create bogus buffer
wxCharBuffer buffer(1);
buffer.data()[0u] = 0;
return buffer; return buffer;
} }
@ -1207,14 +1107,20 @@ wxString::wxString(const wchar_t *pwz, wxMBConv& conv, size_t nLength)
// anything to do? // anything to do?
if ( (nLen != 0) && (nLen != (size_t)-1) ) if ( (nLen != 0) && (nLen != (size_t)-1) )
{ {
//Create a wxStringBufferLength which will access the internal //Get length of converted string
//C char pointer in non-stl mode size_t dwConvLen = conv.WC2MB(NULL, pwz, 0, nLen);
wxStringBufferLength internalBuffer(*this, wxString::WorstEncodingCase(nLen, conv) + 1);
//Do the actual conversion & Set the length of the buffer //if valid, do the conversion
internalBuffer.SetLength( if (dwConvLen != (size_t) -1)
wxMbstr(internalBuffer, pwz, nLen, conv) {
); //Get internal buffer
wxStringBufferLength internalBuffer(*this, dwConvLen + 1);
//Do the actual conversion & Set the length of the buffer
internalBuffer.SetLength(
conv.WC2MB(*this, pwz, dwConvLen + 1, nLen)
);
}
} }
} }
@ -1222,12 +1128,24 @@ wxString::wxString(const wchar_t *pwz, wxMBConv& conv, size_t nLength)
//mode is not enabled and wxUSE_WCHAR_T is enabled //mode is not enabled and wxUSE_WCHAR_T is enabled
const wxWCharBuffer wxString::wc_str(wxMBConv& conv) const const wxWCharBuffer wxString::wc_str(wxMBConv& conv) const
{ {
//mb->wc never inflates to more than the length //Get length of converted string
wxWCharBuffer buffer(length() + 1); size_t dwConvLen = conv.MB2WC(NULL, (*this).c_str(), 0, length());
//Do the actual conversion (will return a blank string on error) //if valid, do the conversion
wxWcstr(buffer.data(), (*this).c_str(), length(), conv); if (dwConvLen != (size_t) -1)
{
//Create good buffer
wxWCharBuffer buffer(dwConvLen + 1);
//Do the actual conversion
conv.MB2WC(buffer.data(), (*this).c_str(), dwConvLen + 1, length());
return buffer;
}
//create bogus buffer
wxWCharBuffer buffer(1);
buffer.data()[0u] = 0;
return buffer; return buffer;
} }