9334ad1727
We didn't handle the case when the length of the input buffer was not specified correctly and wxConvAuto::DetectBOM() could read beyond the end of input. Moreover, the unit test actually relied on this as it didn't pass the correct length for the literal strings with embedded NULs. This somehow worked with MSVC but failed with MinGW (see #10713). Correct the code to handle wxNO_LEN case correctly and fix the unit test to pass the correct lengths. git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@65739 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775
211 lines
5.7 KiB
C++
211 lines
5.7 KiB
C++
///////////////////////////////////////////////////////////////////////////////
|
|
// Name: tests/mbconv/convauto.cpp
|
|
// Purpose: wxConvAuto unit test
|
|
// Author: Vadim Zeitlin
|
|
// Created: 2006-04-04
|
|
// RCS-ID: $Id$
|
|
// Copyright: (c) 2006 Vadim Zeitlin
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
|
|
// ----------------------------------------------------------------------------
|
|
// headers
|
|
// ----------------------------------------------------------------------------
|
|
|
|
#include "testprec.h"
|
|
|
|
#ifdef __BORLANDC__
|
|
#pragma hdrstop
|
|
#endif
|
|
|
|
#include "wx/convauto.h"
|
|
|
|
#include "wx/mstream.h"
|
|
#include "wx/txtstrm.h"
|
|
|
|
// ----------------------------------------------------------------------------
|
|
// test class
|
|
// ----------------------------------------------------------------------------
|
|
|
|
class ConvAutoTestCase : public CppUnit::TestCase
|
|
{
|
|
public:
|
|
ConvAutoTestCase() { }
|
|
|
|
private:
|
|
CPPUNIT_TEST_SUITE( ConvAutoTestCase );
|
|
CPPUNIT_TEST( Empty );
|
|
CPPUNIT_TEST( Short );
|
|
CPPUNIT_TEST( None );
|
|
CPPUNIT_TEST( UTF32LE );
|
|
CPPUNIT_TEST( UTF32BE );
|
|
CPPUNIT_TEST( UTF16LE );
|
|
CPPUNIT_TEST( UTF16BE );
|
|
CPPUNIT_TEST( UTF8 );
|
|
CPPUNIT_TEST( StreamUTF8NoBOM );
|
|
CPPUNIT_TEST( StreamUTF8 );
|
|
CPPUNIT_TEST( StreamUTF16LE );
|
|
CPPUNIT_TEST( StreamUTF16BE );
|
|
CPPUNIT_TEST( StreamUTF32LE );
|
|
CPPUNIT_TEST( StreamUTF32BE );
|
|
CPPUNIT_TEST_SUITE_END();
|
|
|
|
// real test function: check that converting the src multibyte string to
|
|
// wide char using wxConvAuto yields wch as the first result
|
|
//
|
|
// the length of the string may need to be passed explicitly if it has
|
|
// embedded NULs, otherwise it's not necessary
|
|
void TestFirstChar(const char *src, wchar_t wch, int len = wxNO_LEN);
|
|
|
|
void Empty();
|
|
void Short();
|
|
void None();
|
|
void UTF32LE();
|
|
void UTF32BE();
|
|
void UTF16LE();
|
|
void UTF16BE();
|
|
void UTF8();
|
|
|
|
// test whether two lines of text are converted properly from a stream
|
|
void TestTextStream(const char *src,
|
|
size_t srclength,
|
|
const wxString& line1,
|
|
const wxString& line2);
|
|
|
|
void StreamUTF8NoBOM();
|
|
void StreamUTF8();
|
|
void StreamUTF16LE();
|
|
void StreamUTF16BE();
|
|
void StreamUTF32LE();
|
|
void StreamUTF32BE();
|
|
};
|
|
|
|
// register in the unnamed registry so that these tests are run by default
|
|
CPPUNIT_TEST_SUITE_REGISTRATION(ConvAutoTestCase);
|
|
|
|
// also include in it's own registry so that these tests can be run alone
|
|
CPPUNIT_TEST_SUITE_NAMED_REGISTRATION(ConvAutoTestCase, "ConvAutoTestCase");
|
|
|
|
// ----------------------------------------------------------------------------
|
|
// tests
|
|
// ----------------------------------------------------------------------------
|
|
|
|
void ConvAutoTestCase::TestFirstChar(const char *src, wchar_t wch, int len)
|
|
{
|
|
wxWCharBuffer wbuf = wxConvAuto().cMB2WC(src, len, NULL);
|
|
CPPUNIT_ASSERT( wbuf );
|
|
CPPUNIT_ASSERT_EQUAL( wch, *wbuf );
|
|
}
|
|
|
|
void ConvAutoTestCase::Empty()
|
|
{
|
|
CPPUNIT_ASSERT( !wxConvAuto().cMB2WC("") );
|
|
}
|
|
|
|
void ConvAutoTestCase::Short()
|
|
{
|
|
TestFirstChar("1", wxT('1'));
|
|
}
|
|
|
|
void ConvAutoTestCase::None()
|
|
{
|
|
TestFirstChar("Hello world", wxT('H'));
|
|
}
|
|
|
|
void ConvAutoTestCase::UTF32LE()
|
|
{
|
|
TestFirstChar("\xff\xfe\0\0A\0\0\0", wxT('A'), 8);
|
|
}
|
|
|
|
void ConvAutoTestCase::UTF32BE()
|
|
{
|
|
TestFirstChar("\0\0\xfe\xff\0\0\0B", wxT('B'), 8);
|
|
}
|
|
|
|
void ConvAutoTestCase::UTF16LE()
|
|
{
|
|
TestFirstChar("\xff\xfeZ\0", wxT('Z'), 4);
|
|
}
|
|
|
|
void ConvAutoTestCase::UTF16BE()
|
|
{
|
|
TestFirstChar("\xfe\xff\0Y", wxT('Y'), 4);
|
|
}
|
|
|
|
void ConvAutoTestCase::UTF8()
|
|
{
|
|
#ifdef wxHAVE_U_ESCAPE
|
|
TestFirstChar("\xef\xbb\xbf\xd0\x9f", L'\u041f');
|
|
#endif
|
|
}
|
|
|
|
void ConvAutoTestCase::TestTextStream(const char *src,
|
|
size_t srclength,
|
|
const wxString& line1,
|
|
const wxString& line2)
|
|
{
|
|
wxMemoryInputStream instream(src, srclength);
|
|
wxTextInputStream text(instream);
|
|
|
|
CPPUNIT_ASSERT_EQUAL( line1, text.ReadLine() );
|
|
CPPUNIT_ASSERT_EQUAL( line2, text.ReadLine() );
|
|
}
|
|
|
|
// the first line of the teststring used in the following functions is an
|
|
// 'a' followed by a Japanese hiragana A (u+3042).
|
|
// The second line is a single Greek beta (u+03B2). There is no blank line
|
|
// at the end.
|
|
|
|
namespace
|
|
{
|
|
|
|
const wxString line1 = wxString::FromUTF8("a\xe3\x81\x82");
|
|
const wxString line2 = wxString::FromUTF8("\xce\xb2");
|
|
|
|
} // anonymous namespace
|
|
|
|
void ConvAutoTestCase::StreamUTF8NoBOM()
|
|
{
|
|
// currently this test doesn't work because without the BOM wxConvAuto
|
|
// decides that the string is in Latin-1 after finding the first (but not
|
|
// the two subsequent ones which are part of the same UTF-8 sequence!)
|
|
// 8-bit character
|
|
//
|
|
// FIXME: we need to fix this at wxTextInputStream level, see #11570
|
|
#if 0
|
|
TestTextStream("\x61\xE3\x81\x82\x0A\xCE\xB2",
|
|
7, line1, line2);
|
|
#endif
|
|
}
|
|
|
|
void ConvAutoTestCase::StreamUTF8()
|
|
{
|
|
TestTextStream("\xEF\xBB\xBF\x61\xE3\x81\x82\x0A\xCE\xB2",
|
|
10, line1, line2);
|
|
}
|
|
|
|
void ConvAutoTestCase::StreamUTF16LE()
|
|
{
|
|
TestTextStream("\xFF\xFE\x61\x00\x42\x30\x0A\x00\xB2\x03",
|
|
10, line1, line2);
|
|
}
|
|
|
|
void ConvAutoTestCase::StreamUTF16BE()
|
|
{
|
|
TestTextStream("\xFE\xFF\x00\x61\x30\x42\x00\x0A\x03\xB2",
|
|
10, line1, line2);
|
|
}
|
|
|
|
void ConvAutoTestCase::StreamUTF32LE()
|
|
{
|
|
TestTextStream("\xFF\xFE\0\0\x61\x00\0\0\x42\x30\0\0\x0A"
|
|
"\x00\0\0\xB2\x03\0\0",
|
|
20, line1, line2);
|
|
}
|
|
|
|
void ConvAutoTestCase::StreamUTF32BE()
|
|
{
|
|
TestTextStream("\0\0\xFE\xFF\0\0\x00\x61\0\0\x30\x42\0\0\x00\x0A"
|
|
"\0\0\x03\xB2",
|
|
20, line1, line2);
|
|
}
|