initialize wxStringBuffer with the original contents of wxString it was created from for better compatibility with the old, non-STL, build (this avoids problems such as ticket #4845); add wxString::tchar_buf() to help with the implementation

git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@53995 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775
2008-06-06 21:19:23 +00:00 · 2008-06-06 21:19:23 +00:00 · 062dc5fc22
commit 062dc5fc22
parent 1bc8210593
3 changed files with 231 additions and 68 deletions
--- a/include/wx/string.h
+++ b/include/wx/string.h
@ -65,6 +65,11 @@ class WXDLLIMPEXP_FWD_BASE wxString;
    #define WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER 1
 #endif

+namespace wxPrivate
+{
+    template <typename T> struct wxStringAsBufHelper;
+}
+
 // ---------------------------------------------------------------------------
 // macros
 // ---------------------------------------------------------------------------
@ -1211,6 +1216,30 @@ public:
        { return mb_str(conv); }
    wxWritableWCharBuffer wchar_str() const { return wc_str(); }

+    // conversion to the buffer of the given type T (= char or wchar_t) and
+    // also optionally return the buffer length
+    //
+    // this is mostly/only useful for the template functions
+    //
+    // FIXME-VC6: the second argument only exists for VC6 which doesn't support
+    //            explicit template function selection, do not use it unless
+    //            you must support VC6!
+    template <typename T>
+    wxCharTypeBuffer<T> tchar_str(size_t *len = NULL,
+                                  T * WXUNUSED(dummy) = NULL) const
+    {
+#if wxUSE_UNICODE
+        // we need a helper dispatcher depending on type
+        return wxPrivate::wxStringAsBufHelper<T>::Get(*this, len);
+#else // ANSI
+        // T can only be char in ANSI build
+        if ( len )
+            *len = length();
+
+        return wxCharTypeBuffer<T>::CreateNonOwned(wx_str());
+#endif // Unicode build kind
+    }
+
    // conversion to/from plain (i.e. 7 bit) ASCII: this is useful for
    // converting numbers or strings which are certain not to contain special
    // chars (typically system functions, X atoms, environment variables etc.)
@ -1259,6 +1288,10 @@ public:
    }
    const char* utf8_str() const { return wx_str(); }
    const char* ToUTF8() const { return wx_str(); }
+
+    // this function exists in UTF-8 build only and returns the length of the
+    // internal UTF-8 representation
+    size_t utf8_length() const { return m_impl.length(); }
 #elif wxUSE_UNICODE_WCHAR
    static wxString FromUTF8(const char *utf8)
      { return wxString(utf8, wxMBConvUTF8()); }
@ -2715,6 +2748,67 @@ inline wxString operator+(wchar_t ch, const wxString& string)

 #define wxGetEmptyString() wxString()

+// ----------------------------------------------------------------------------
+// helper functions which couldn't be defined inline
+// ----------------------------------------------------------------------------
+
+namespace wxPrivate
+{
+
+#if wxUSE_UNICODE_WCHAR
+
+template <>
+struct wxStringAsBufHelper<char>
+{
+    static wxCharBuffer Get(const wxString& s, size_t *len)
+    {
+        wxCharBuffer buf(s.mb_str());
+        if ( len )
+            *len = buf ? strlen(buf) : 0;
+        return buf;
+    }
+};
+
+template <>
+struct wxStringAsBufHelper<wchar_t>
+{
+    static wxWCharBuffer Get(const wxString& s, size_t *len)
+    {
+        if ( len )
+            *len = s.length();
+        return wxWCharBuffer::CreateNonOwned(s.wx_str());
+    }
+};
+
+#elif wxUSE_UNICODE_UTF8
+
+template <>
+struct wxStringAsBufHelper<char>
+{
+    static wxCharBuffer Get(const wxString& s, size_t *len)
+    {
+        if ( len )
+            *len = s.utf8_length();
+        return wxCharBuffer::CreateNonOwned(s.wx_str());
+    }
+};
+
+template <>
+struct wxStringAsBufHelper<wchar_t>
+{
+    static wxWCharBuffer Get(const wxString& s, size_t *len)
+    {
+        wxWCharBuffer wbuf(s.wc_str());
+        if ( len )
+            *len = wxWcslen(wbuf);
+        return wbuf;
+    }
+};
+
+#endif // Unicode build kind
+
+} // namespace wxPrivate
+
 // ----------------------------------------------------------------------------
 // wxStringBuffer: a tiny class allowing to get a writable pointer into string
 // ----------------------------------------------------------------------------
@ -2782,8 +2876,30 @@ public:

    wxStringTypeBufferBase(wxString& str, size_t lenWanted = 1024)
        : m_str(str), m_buf(lenWanted)
-        { }
+    {
+        // for compatibility with old wxStringBuffer which provided direct
+        // access to wxString internal buffer, initialize ourselves with the
+        // string initial contents

+        // FIXME-VC6: remove the ugly (CharType *)NULL and use normal
+        //            tchar_str<CharType>
+        size_t len;
+        const wxCharTypeBuffer<CharType> buf(str.tchar_str(&len, (CharType *)NULL));
+        if ( buf )
+        {
+            if ( len > lenWanted )
+            {
+                // in this case there is not enough space for terminating NUL,
+                // ensure that we still put it there
+                m_buf.data()[lenWanted] = 0;
+                len = lenWanted - 1;
+            }
+
+            wxTmemcpy(m_buf.data(), buf, len + 1);
+        }
+        //else: conversion failed, this can happen when trying to get Unicode
+        //      string contents into a char string
+    }

    operator CharType*() { return m_buf.data(); }

@ -2794,22 +2910,25 @@ protected:

 template<typename T>
 class WXDLLIMPEXP_BASE wxStringTypeBufferLengthBase
+    : public wxStringTypeBufferBase<T>
 {
 public:
-    typedef T CharType;
-
    wxStringTypeBufferLengthBase(wxString& str, size_t lenWanted = 1024)
-        : m_str(str), m_buf(lenWanted), m_len(0), m_lenSet(false)
+        : wxStringTypeBufferBase<T>(str, lenWanted),
+          m_len(0),
+          m_lenSet(false)
        { }

-    operator CharType*() { return m_buf.data(); }
+    ~wxStringTypeBufferLengthBase()
+    {
+        wxASSERT_MSG( this->m_lenSet, "forgot to call SetLength()" );
+    }
+
    void SetLength(size_t length) { m_len = length; m_lenSet = true; }

 protected:
-    wxString& m_str;
-    wxCharTypeBuffer<CharType> m_buf;
-    size_t        m_len;
-    bool          m_lenSet;
+    size_t m_len;
+    bool m_lenSet;
 };

 template<typename T>
@ -2817,7 +2936,9 @@ class wxStringTypeBuffer : public wxStringTypeBufferBase<T>
 {
 public:
    wxStringTypeBuffer(wxString& str, size_t lenWanted = 1024)
-        : wxStringTypeBufferBase<T>(str, lenWanted) {}
+        : wxStringTypeBufferBase<T>(str, lenWanted)
+        { }
+
    ~wxStringTypeBuffer()
    {
        this->m_str.assign(this->m_buf.data());
@ -2831,11 +2952,11 @@ class wxStringTypeBufferLength : public wxStringTypeBufferLengthBase<T>
 {
 public:
    wxStringTypeBufferLength(wxString& str, size_t lenWanted = 1024)
-        : wxStringTypeBufferLengthBase<T>(str, lenWanted) {}
+        : wxStringTypeBufferLengthBase<T>(str, lenWanted)
+        { }

    ~wxStringTypeBufferLength()
    {
-        wxASSERT(this->m_lenSet);
        this->m_str.assign(this->m_buf.data(), this->m_len);
    }

@ -2869,12 +2990,12 @@ public:

    ~wxStringInternalBufferLength()
    {
-        wxASSERT(m_lenSet);
        m_str.m_impl.assign(m_buf.data(), m_len);
    }

    DECLARE_NO_COPY_CLASS(wxStringInternalBufferLength)
 };
+
 #endif // wxUSE_STL_BASED_WXSTRING


--- a/interface/string.h
+++ b/interface/string.h
@ -72,25 +72,25 @@ public:
    @class wxString
    @wxheader{string.h}

-    wxString is a class representing a Unicode character string.  
+    wxString is a class representing a Unicode character string.
    wxString uses @c std::string internally to store its content
    unless this is not supported by the compiler or disabled
-    specifically when building wxWidgets. Therefore wxString 
+    specifically when building wxWidgets. Therefore wxString
    inherits many features from @c std::string's. Most
    implementations of @std::string are thread-safe and don't
    use reference counting. By default, wxString uses @c std::string
    internally even if wxUSE_STL is not defined.
-    
+
    Since wxWidgets 3.0 wxString internally uses UCS-2 (basically 2-byte per
    character wchar_t) under Windows and UTF-8 under Unix, Linux and
    OS X to store its content. Much work has been done to make existing
-    code using ANSI string literals work as before. If you need to have a 
+    code using ANSI string literals work as before. If you need to have a
    wxString that uses wchar_t on Unix and Linux, too, you can specify
    this on the command line with the @c configure @c --disable-utf8 switch.

    As a consequence of this change, iterating over a wxString by index
    can become inefficient in UTF8 mode and iterators should be used instead:
-    
+
    @code
    wxString s = "hello";
    wxString::const_iterator i;
@ -100,9 +100,9 @@ public:
        // do something with it
    }
    @endcode
-    
-    Please see the 
-    @ref overview_string "wxString overview" and the 
+
+    Please see the
+    @ref overview_string "wxString overview" and the
    @ref overview_unicode "Unicode overview" for more information
    about it.

@ -112,7 +112,7 @@ public:
    conversion, the @a wxConvLibc class instance is used. See wxCSConv and wxMBConv.

    wxString implements most of the methods of the @c std::string class.
-    These standard functions are only listed here, but they are not 
+    These standard functions are only listed here, but they are not
    fully documented in this manual. Please see the STL documentation.
    The behaviour of all these functions is identical to the behaviour
    described there.
@ -125,7 +125,7 @@ public:
        Anything may be concatenated (appended to) with a string. However, you can't
        append something to a C string (including literal constants), so to do this it
        should be converted to a wxString first.
-        
+
        @li operator<<()
        @li operator+=()
        @li operator+()
@ -136,7 +136,7 @@ public:
        a single character or a wide (UNICODE) string. For all constructors (except the
        default which creates an empty string) there is also a corresponding assignment
        operator.
-        
+
        @li wxString()
        @li operator=()
        @li ~wxString()
@ -144,7 +144,7 @@ public:
        The MakeXXX() variants modify the string in place, while the other functions
        return a new string which contains the original text converted to the upper or
        lower case and leave the original string unchanged.
-        
+
        @li MakeUpper()
        @li Upper()
        @li MakeLower()
@ -158,8 +158,8 @@ public:
        done in release builds.
        This section also contains both implicit and explicit conversions to C style
        strings. Although implicit conversion is quite convenient, it is advised to use
-        explicit c_str() method for the sake of clarity. 
-        
+        explicit c_str() method for the sake of clarity.
+
        @li GetChar()
        @li GetWritableChar()
        @li SetChar()
@ -177,12 +177,12 @@ public:
        convenient if only equality of the strings matters because it returns a boolean
        @true value if the strings are the same and not 0 (which is usually @false
        in C)as Cmp() does.
-        Matches() is a poor man's regular expression matcher: it only understands 
+        Matches() is a poor man's regular expression matcher: it only understands
        '*' and '?' metacharacters in the sense of DOS command line interpreter.
        StartsWith() is helpful when parsing a line of text which should start
        with some predefined prefix and is more efficient than doing direct string
        comparison as you would also have to precalculate the length of the prefix then.
-        
+
        @li Cmp()
        @li CmpNoCase()
        @li IsSameAs()
@ -194,7 +194,7 @@ public:
        floating point numbers. All three functions take a pointer to the variable to
        put the numeric value in and return @true if the @b entire string could be
        converted to a number.
-        
+
        @li ToLong()
        @li ToLongLong()
        @li ToULong()
@ -206,21 +206,21 @@ public:
        wxStringBuffer and wxStringBufferLength classes may be very useful
        when working with some external API which requires the caller to provide
        a writable buffer.
-        
+
        @li Alloc()
        @li Shrink()
        @li wxStringBuffer
        @li wxStringBufferLength

        Misc. other string functions.
-        
+
        @li Trim()
        @li Truncate()
        @li Pad()

        These functions return the string length and check whether the string
        is empty or empty it.
-        
+
        @li Len()
        @li IsEmpty()
        @li operator!()
@ -231,7 +231,7 @@ public:
        These functions allow to extract substring from this string. All of them don't
        modify the original string and return a new string containing the extracted
        substring.
-        
+
        @li Mid()
        @li operator()()
        @li Left()
@ -245,7 +245,7 @@ public:

        These functions replace the standard @e strchr() and @e strstr()
        functions.
-        
+
        @li Find()
        @li Replace()

@ -261,7 +261,7 @@ public:

        These functions are deprecated, please consider using new wxWidgets 2.0
        functions instead of them (or, even better, std::string compatible variants).
-        
+
        Contains(), First(), Freq(), IsAscii(), IsNull(),
        IsNumber(), IsWord(), Last(), Length(), LowerCase(), Remove(), Strip(),
        SubString(), UpperCase()
@ -283,7 +283,7 @@ public:
    */
    static const size_t npos;

-    /** 
+    /**
        @name Standard types
    */
    //@{
@ -300,13 +300,13 @@ public:
       Default constructor
    */
    wxString();
-    
+
    /**
-       Creates a string from another string. Just increases the ref 
+       Creates a string from another string. Just increases the ref
       count by 1.
    */
    wxString(const wxString& stringSrc);
-    
+

    /**
       Constructs a string from the string literal @e psz using
@ -347,23 +347,23 @@ public:
       the current locale encoding to convert it to Unicode.
    */
    wxString(const wxCharBuffer& buf);
-    
+
    /**
       Constructs a string from @e buf.
    */
    wxString(const wxWCharBuffer& buf);

    /**
-       Constructs a string from @e str using the using the current locale encoding 
+       Constructs a string from @e str using the using the current locale encoding
       to convert it to Unicode (wxConvLibc).
    */
    wxString(const std::string& str);
-    
+
    /**
       Constructs a string from @e str.
    */
    wxString(const std::wstring& str);
-    
+

    /**
        String destructor. Note that this is not virtual, so wxString must not be
@ -490,7 +490,7 @@ public:
        Returns a positive value if the string is greater than the argument,
        zero if it is equal to it or a negative value if it is less than the
        argument (same semantics as the standard @c strcmp() function).
-        
+
        See also CmpNoCase(), IsSameAs().
    */
    int Cmp(const wxString& s) const;
@ -500,7 +500,7 @@ public:
        Returns a positive value if the string is greater than the argument,
        zero if it is equal to it or a negative value if it is less than the
        argument (same semantics as the standard @c strcmp() function).
-        
+
        See also Cmp(), IsSameAs().
    */
    int CmpNoCase(const wxString& s) const;
@ -553,9 +553,9 @@ public:
        @c wxNOT_FOUND if not found.
    */
    int Find(wxUniChar ch, bool fromEnd = false) const;
-    
+
    /**
-        Searches for the given string @e sub. Returns the starting position or 
+        Searches for the given string @e sub. Returns the starting position or
        @c wxNOT_FOUND if not found.
    */
    int Find(const wxString& sub) const;
@ -563,7 +563,7 @@ public:
    //@{
    /**
        Same as Find().
-        This is a wxWidgets 1.xx compatibility function; 
+        This is a wxWidgets 1.xx compatibility function;
        you should not use it in new code.
    */
    int First(wxUniChar ch) const;
@ -616,7 +616,7 @@ public:
    //@{
    /**
        Converts the string or character from an ASCII, 7-bit form
-        to the native wxString representation. 
+        to the native wxString representation.
    */
    static wxString FromAscii(const char* s);
    static wxString FromAscii(const unsigned char* s);
@ -710,7 +710,7 @@ public:
    //@{
    /**
        Returns a reference to the last character (writable).
-        This is a wxWidgets 1.xx compatibility function; 
+        This is a wxWidgets 1.xx compatibility function;
        you should not use it in new code.
    */
    wxUniCharRef Last();
@ -1008,7 +1008,7 @@ public:
    /**
        Returns a pointer to the string data (@c const char* when using UTF-8
        internally, @c const wchar_t* when using UCS-2 internally).
-        
+
        Note that the returned value is not convertible to @c char* or
        @c wchar_t*, use char_str() or wchar_str() if you need to pass
        string value to a function expecting non-const pointer.
@ -1026,10 +1026,33 @@ public:
    */
    wxWritableCharBuffer char_str(const wxMBConv& conv = wxConvLibc) const;

+    /**
+        Returns buffer of the specified type containing the string data.
+
+        This method is only useful in template code, otherwise you should
+        directly call mb_str() or wc_str() if you need to retrieve a narrow or
+        wide string from this wxString. The template parameter @a t should be
+        either @c char or @c wchar_t.
+
+        Notice that retrieving a char buffer in UTF-8 build will return the
+        internal string representation in UTF-8 while in wchar_t build the char
+        buffer will contain the conversion of the string to the encoding of the
+        current locale (and so can fail).
+
+        @param len If non-@NULL, filled with the length of the returned buffer.
+        @return
+            buffer containing the string contents in the specified type,
+            notice that it may be @NULL if the conversion failed (e.g. Unicode
+            string couldn't be converted to the current encoding when @a T is
+            @c char).
+     */
+    template <typename T>
+    wxCharTypeBuffer<T> tchar_str(size_t *len = NULL) const;
+
    //@{
    /**
        Returns string representation suitable for passing to OS' functions
-        for file handling. 
+        for file handling.
    */
    const wchar_t* fn_str() const;
    const char* fn_str() const;
@ -1110,7 +1133,7 @@ public:
    /**
        Empty string is @false, so !string will only return @true if the
        string is empty.
-        
+
        See also IsEmpty().
    */
    bool operator!() const;
@ -1131,7 +1154,7 @@ public:
        Converts the strings contents to the wide character represention
        and returns it as a temporary wxWCharBuffer object or returns a
        pointer to the internal string contents in wide character mode.
-        
+
        The macro wxWX2WCbuf is defined as the correct return
        type (without const).

@ -1154,7 +1177,7 @@ public:

    /**
        @name Iterator interface
-        
+
        These methods return iterators to the beginnnig or
        end of the string.
    */
@ -1172,8 +1195,8 @@ public:

    /**
        @name STL interface
-    
-        The supported STL functions are listed here. Please see any 
+
+        The supported STL functions are listed here. Please see any
        STL reference for their documentation.
    */
    //@{
@ -1200,7 +1223,7 @@ public:
        wxString& assign(const_iterator first, const_iterator last);

        void clear();
-        
+
        int compare(const wxString& str) const;
        int compare(size_t nStart, size_t nLen, const wxString& str) const;
        int compare(size_t nStart, size_t nLen,
@ -1257,9 +1280,9 @@ public:
        size_t rfind(wxUniChar ch, size_t nStart = npos) const;

        wxString substr(size_t nStart = 0, size_t nLen = npos) const;
-    
+
        void swap(wxString& str);
-  
+
    //@}

 };
--- a/tests/strings/strings.cpp
+++ b/tests/strings/strings.cpp
@ -53,7 +53,7 @@ private:
        CPPUNIT_TEST( ToULongLong );
 #endif // wxLongLong_t
        CPPUNIT_TEST( ToDouble );
-        CPPUNIT_TEST( WriteBuf );
+        CPPUNIT_TEST( StringBuf );
        CPPUNIT_TEST( UTF8Buf );
        CPPUNIT_TEST( CStrDataTernaryOperator );
        CPPUNIT_TEST( CStrDataOperators );
@ -82,7 +82,7 @@ private:
    void ToULongLong();
 #endif // wxLongLong_t
    void ToDouble();
-    void WriteBuf();
+    void StringBuf();
    void UTF8Buf();
    void CStrDataTernaryOperator();
    void DoCStrDataTernaryOperator(bool cond);
@ -661,31 +661,50 @@ void StringTestCase::ToDouble()
    }
 }

-void StringTestCase::WriteBuf()
+void StringTestCase::StringBuf()
 {
+    // check that buffer can be used to write into the string
    wxString s;
    wxStrcpy(wxStringBuffer(s, 10), _T("foo"));

-    CPPUNIT_ASSERT(s[0u] == _T('f') );
+    WX_ASSERT_SIZET_EQUAL(3, s.length());
    CPPUNIT_ASSERT(_T('f') == s[0u]);
    CPPUNIT_ASSERT(_T('o') == s[1]);
    CPPUNIT_ASSERT(_T('o') == s[2]);
-    WX_ASSERT_SIZET_EQUAL(3, s.length());

+    {
+        // also check that the buffer initially contains the original string
+        // contents
+        wxStringBuffer buf(s, 10);
+        CPPUNIT_ASSERT_EQUAL( _T('f'), buf[0] );
+        CPPUNIT_ASSERT_EQUAL( _T('o'), buf[1] );
+        CPPUNIT_ASSERT_EQUAL( _T('o'), buf[2] );
+        CPPUNIT_ASSERT_EQUAL( _T('\0'), buf[3] );
+    }

    {
        wxStringBufferLength buf(s, 10);
+        CPPUNIT_ASSERT_EQUAL( _T('f'), buf[0] );
+        CPPUNIT_ASSERT_EQUAL( _T('o'), buf[1] );
+        CPPUNIT_ASSERT_EQUAL( _T('o'), buf[2] );
+        CPPUNIT_ASSERT_EQUAL( _T('\0'), buf[3] );
+
+        // and check that it can be used to write only the specified number of
+        // characters to the string
        wxStrcpy(buf, _T("barrbaz"));
        buf.SetLength(4);
    }

+    WX_ASSERT_SIZET_EQUAL(4, s.length());
    CPPUNIT_ASSERT(_T('b') == s[0u]);
    CPPUNIT_ASSERT(_T('a') == s[1]);
    CPPUNIT_ASSERT(_T('r') == s[2]);
    CPPUNIT_ASSERT(_T('r') == s[3]);
-    WX_ASSERT_SIZET_EQUAL(4, s.length());

-    CPPUNIT_ASSERT_EQUAL( 0, wxStrcmp(_T("barr"), s) );
+    // check that creating buffer of length smaller than string works, i.e. at
+    // least doesn't crash (it would if we naively copied the entire original
+    // string contents in the buffer)
+    *wxStringBuffer(s, 1) = '!';
 }

 void StringTestCase::UTF8Buf()