Change QStringBuilder to use UTF-8 too
This commit completes the previous commit so that both QString and QStringBuilder now operate on UTF-8 input. A small fix was required in QStringBuilder: an `if` clause inside a single function isn't enough to separate the two append versions, because both branches are still compiled for every template instantiation. Since there are no QString functions that append to char*, when we're converting to a QByteArray we need to go through a QString first, in a separate function overload. Change-Id: Ic503340c5d0c32d420c90c91cc2e0fc1ae9230f3 Reviewed-by: Lars Knoll <lars.knoll@nokia.com>
This commit is contained in:
parent
592fe0a026
commit
8ddd8c8ba9
@ -108,12 +108,24 @@ void QAbstractConcatenable::convertFromAscii(const char *a, int len, QChar *&out
|
|||||||
if (len == -1) {
|
if (len == -1) {
|
||||||
if (!a)
|
if (!a)
|
||||||
return;
|
return;
|
||||||
while (*a)
|
while (*a && uchar(*a) < 0x80U)
|
||||||
*out++ = QLatin1Char(*a++);
|
*out++ = QLatin1Char(*a++);
|
||||||
|
if (!*a)
|
||||||
|
return;
|
||||||
} else {
|
} else {
|
||||||
for (int i = 0; i < len; ++i)
|
int i;
|
||||||
|
for (i = 0; i < len && uchar(a[i]) < 0x80U; ++i)
|
||||||
*out++ = QLatin1Char(a[i]);
|
*out++ = QLatin1Char(a[i]);
|
||||||
|
if (i == len)
|
||||||
|
return;
|
||||||
|
a += i;
|
||||||
|
len -= i;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// a non-ASCII byte was found: decode the remaining input as UTF-8 and append it
|
||||||
|
QString tmp = QString::fromUtf8(a, len);
|
||||||
|
memcpy(out, reinterpret_cast<const char *>(tmp.constData()), sizeof(QChar) * tmp.size());
|
||||||
|
out += tmp.size();
|
||||||
}
|
}
|
||||||
|
|
||||||
QT_END_NAMESPACE
|
QT_END_NAMESPACE
|
||||||
|
@ -381,15 +381,11 @@ operator+(const A &a, const B &b)
|
|||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
namespace QtStringBuilder {
|
||||||
template <typename A, typename B>
|
template <typename A, typename B>
|
||||||
QByteArray &operator+=(QByteArray &a, const QStringBuilder<A, B> &b)
|
QByteArray &appendToByteArray(QByteArray &a, const QStringBuilder<A, B> &b, char)
|
||||||
{
|
{
|
||||||
#ifndef QT_NO_CAST_TO_ASCII
|
// append 8-bit data to a byte array
|
||||||
if (sizeof(typename QConcatenable< QStringBuilder<A, B> >::ConvertTo::value_type) == sizeof(QChar)) {
|
|
||||||
// it is not safe to optimize here, as with UTF-8 it is not possible to compute the size in advance
|
|
||||||
return a += QString(b);
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
int len = a.size() + QConcatenable< QStringBuilder<A, B> >::size(b);
|
int len = a.size() + QConcatenable< QStringBuilder<A, B> >::size(b);
|
||||||
a.reserve(len);
|
a.reserve(len);
|
||||||
char *it = a.data() + a.size();
|
char *it = a.data() + a.size();
|
||||||
@ -398,6 +394,23 @@ QByteArray &operator+=(QByteArray &a, const QStringBuilder<A, B> &b)
|
|||||||
return a;
|
return a;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifndef QT_NO_CAST_TO_ASCII
|
||||||
|
template <typename A, typename B>
|
||||||
|
QByteArray &appendToByteArray(QByteArray &a, const QStringBuilder<A, B> &b, QChar)
|
||||||
|
{
|
||||||
|
// append UTF-16 data to the byte array
|
||||||
|
return a += QString(b);
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
}
|
||||||
|
|
||||||
|
template <typename A, typename B>
|
||||||
|
QByteArray &operator+=(QByteArray &a, const QStringBuilder<A, B> &b)
|
||||||
|
{
|
||||||
|
return QtStringBuilder::appendToByteArray(a, b,
|
||||||
|
typename QConcatenable< QStringBuilder<A, B> >::ConvertTo::value_type());
|
||||||
|
}
|
||||||
|
|
||||||
template <typename A, typename B>
|
template <typename A, typename B>
|
||||||
QString &operator+=(QString &a, const QStringBuilder<A, B> &b)
|
QString &operator+=(QString &a, const QStringBuilder<A, B> &b)
|
||||||
{
|
{
|
||||||
|
@ -45,7 +45,7 @@
|
|||||||
#define LITERAL_LEN (sizeof(LITERAL)-1)
|
#define LITERAL_LEN (sizeof(LITERAL)-1)
|
||||||
#define LITERAL_EXTRA "some literal" "EXTRA"
|
#define LITERAL_EXTRA "some literal" "EXTRA"
|
||||||
|
|
||||||
// "some literal", but replacing all vocals by their umlauted UTF-8 string :)
|
// "some literal", but replacing all vowels by their umlauted UTF-8 string :)
|
||||||
#define UTF8_LITERAL "s\xc3\xb6m\xc3\xab l\xc3\xaft\xc3\xabr\xc3\xa4l"
|
#define UTF8_LITERAL "s\xc3\xb6m\xc3\xab l\xc3\xaft\xc3\xabr\xc3\xa4l"
|
||||||
#define UTF8_LITERAL_LEN (sizeof(UTF8_LITERAL)-1)
|
#define UTF8_LITERAL_LEN (sizeof(UTF8_LITERAL)-1)
|
||||||
#define UTF8_LITERAL_EXTRA "s\xc3\xb6m\xc3\xab l\xc3\xaft\xc3\xabr\xc3\xa4l" "EXTRA"
|
#define UTF8_LITERAL_EXTRA "s\xc3\xb6m\xc3\xab l\xc3\xaft\xc3\xabr\xc3\xa4l" "EXTRA"
|
||||||
@ -131,14 +131,6 @@ void runScenario()
|
|||||||
r = string P ba;
|
r = string P ba;
|
||||||
QCOMPARE(r, r2);
|
QCOMPARE(r, r2);
|
||||||
|
|
||||||
#if 0
|
|
||||||
// now test with codec for C strings set
|
|
||||||
// TODO: to be re-enabled once strings default to utf8, in place of the
|
|
||||||
// latin1 code above.
|
|
||||||
QTextCodec::setCodecForCStrings(QTextCodec::codecForName("UTF-8"));
|
|
||||||
QVERIFY(QTextCodec::codecForCStrings());
|
|
||||||
QCOMPARE(QTextCodec::codecForCStrings()->name(), QByteArray("UTF-8"));
|
|
||||||
|
|
||||||
string = QString::fromUtf8(UTF8_LITERAL);
|
string = QString::fromUtf8(UTF8_LITERAL);
|
||||||
ba = UTF8_LITERAL;
|
ba = UTF8_LITERAL;
|
||||||
|
|
||||||
@ -157,7 +149,6 @@ void runScenario()
|
|||||||
QCOMPARE(r, r3);
|
QCOMPARE(r, r3);
|
||||||
r = string P ba;
|
r = string P ba;
|
||||||
QCOMPARE(r, r3);
|
QCOMPARE(r, r3);
|
||||||
#endif
|
|
||||||
|
|
||||||
ba = QByteArray(); // empty
|
ba = QByteArray(); // empty
|
||||||
r = ba P string;
|
r = ba P string;
|
||||||
@ -217,11 +208,8 @@ void runScenario()
|
|||||||
str += QLatin1String(LITERAL) P str;
|
str += QLatin1String(LITERAL) P str;
|
||||||
QCOMPARE(str, QString::fromUtf8(UTF8_LITERAL LITERAL UTF8_LITERAL));
|
QCOMPARE(str, QString::fromUtf8(UTF8_LITERAL LITERAL UTF8_LITERAL));
|
||||||
#ifndef QT_NO_CAST_FROM_ASCII
|
#ifndef QT_NO_CAST_FROM_ASCII
|
||||||
#if 0
|
|
||||||
// TODO: this relies on strings defaulting to utf8, so disable this for now.
|
|
||||||
str = (QString::fromUtf8(UTF8_LITERAL) += QLatin1String(LITERAL) P UTF8_LITERAL);
|
str = (QString::fromUtf8(UTF8_LITERAL) += QLatin1String(LITERAL) P UTF8_LITERAL);
|
||||||
QCOMPARE(str, QString::fromUtf8(UTF8_LITERAL LITERAL UTF8_LITERAL));
|
QCOMPARE(str, QString::fromUtf8(UTF8_LITERAL LITERAL UTF8_LITERAL));
|
||||||
#endif
|
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -237,13 +225,10 @@ void runScenario()
|
|||||||
ba2 += ba2 P withZero;
|
ba2 += ba2 P withZero;
|
||||||
QCOMPARE(ba2, QByteArray(withZero + withZero + withZero));
|
QCOMPARE(ba2, QByteArray(withZero + withZero + withZero));
|
||||||
#ifndef QT_NO_CAST_TO_ASCII
|
#ifndef QT_NO_CAST_TO_ASCII
|
||||||
#if 0
|
|
||||||
// TODO: this relies on strings defaulting to utf8, so disable this for now.
|
|
||||||
ba = UTF8_LITERAL;
|
ba = UTF8_LITERAL;
|
||||||
ba2 = (ba += QLatin1String(LITERAL) + QString::fromUtf8(UTF8_LITERAL));
|
ba2 = (ba += QLatin1String(LITERAL) + QString::fromUtf8(UTF8_LITERAL));
|
||||||
QCOMPARE(ba2, ba);
|
QCOMPARE(ba2, ba);
|
||||||
QCOMPARE(ba, QByteArray(UTF8_LITERAL LITERAL UTF8_LITERAL));
|
QCOMPARE(ba, QByteArray(UTF8_LITERAL LITERAL UTF8_LITERAL));
|
||||||
#endif
|
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user