2017-09-27 00:25:20 +00:00
|
|
|
|
// © 2017 and later: Unicode, Inc. and others.
|
|
|
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
|
|
|
|
2017-10-04 22:51:06 +00:00
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
|
|
2017-10-05 00:47:38 +00:00
|
|
|
|
#if !UCONFIG_NO_FORMATTING && !UPRV_INCOMPLETE_CPP11_SUPPORT
|
2017-09-27 05:31:57 +00:00
|
|
|
|
|
2017-09-27 00:25:20 +00:00
|
|
|
|
#include "putilimp.h"
|
|
|
|
|
#include "unicode/dcfmtsym.h"
|
|
|
|
|
#include "numbertest.h"
|
|
|
|
|
#include "number_utils.h"
|
|
|
|
|
|
|
|
|
|
using namespace icu::number::impl;
|
|
|
|
|
|
|
|
|
|
class DefaultSymbolProvider : public SymbolProvider {
|
|
|
|
|
DecimalFormatSymbols fSymbols;
|
|
|
|
|
|
|
|
|
|
public:
|
|
|
|
|
DefaultSymbolProvider(UErrorCode &status) : fSymbols(Locale("ar_SA"), status) {}
|
|
|
|
|
|
2017-10-06 09:02:10 +00:00
|
|
|
|
virtual UnicodeString getSymbol(AffixPatternType type) const U_OVERRIDE {
|
2017-09-27 00:25:20 +00:00
|
|
|
|
switch (type) {
|
|
|
|
|
case TYPE_MINUS_SIGN:
|
|
|
|
|
return u"−";
|
|
|
|
|
case TYPE_PLUS_SIGN:
|
|
|
|
|
return fSymbols.getConstSymbol(DecimalFormatSymbols::ENumberFormatSymbol::kPlusSignSymbol);
|
|
|
|
|
case TYPE_PERCENT:
|
|
|
|
|
return fSymbols.getConstSymbol(DecimalFormatSymbols::ENumberFormatSymbol::kPercentSymbol);
|
|
|
|
|
case TYPE_PERMILLE:
|
|
|
|
|
return fSymbols.getConstSymbol(DecimalFormatSymbols::ENumberFormatSymbol::kPerMillSymbol);
|
|
|
|
|
case TYPE_CURRENCY_SINGLE:
|
|
|
|
|
return u"$";
|
|
|
|
|
case TYPE_CURRENCY_DOUBLE:
|
|
|
|
|
return u"XXX";
|
|
|
|
|
case TYPE_CURRENCY_TRIPLE:
|
|
|
|
|
return u"long name";
|
|
|
|
|
case TYPE_CURRENCY_QUAD:
|
|
|
|
|
return u"\uFFFD";
|
|
|
|
|
case TYPE_CURRENCY_QUINT:
|
|
|
|
|
// TODO: Add support for narrow currency symbols here.
|
|
|
|
|
return u"\uFFFD";
|
|
|
|
|
case TYPE_CURRENCY_OVERFLOW:
|
|
|
|
|
return u"\uFFFD";
|
|
|
|
|
default:
|
|
|
|
|
U_ASSERT(false);
|
2017-10-06 09:02:10 +00:00
|
|
|
|
return {}; // silence compiler warnings
|
2017-09-27 00:25:20 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
void AffixUtilsTest::runIndexedTest(int32_t index, UBool exec, const char *&name, char *) {
|
|
|
|
|
if (exec) {
|
|
|
|
|
logln("TestSuite AffixUtilsTest: ");
|
|
|
|
|
}
|
|
|
|
|
TESTCASE_AUTO_BEGIN;
|
|
|
|
|
TESTCASE_AUTO(testEscape);
|
|
|
|
|
TESTCASE_AUTO(testUnescape);
|
|
|
|
|
TESTCASE_AUTO(testContainsReplaceType);
|
|
|
|
|
TESTCASE_AUTO(testInvalid);
|
|
|
|
|
TESTCASE_AUTO(testUnescapeWithSymbolProvider);
|
|
|
|
|
TESTCASE_AUTO_END;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void AffixUtilsTest::testEscape() {
|
|
|
|
|
static const char16_t *cases[][2] = {{u"", u""},
|
|
|
|
|
{u"abc", u"abc"},
|
|
|
|
|
{u"-", u"'-'"},
|
|
|
|
|
{u"-!", u"'-'!"},
|
|
|
|
|
{u"−", u"−"},
|
|
|
|
|
{u"---", u"'---'"},
|
|
|
|
|
{u"-%-", u"'-%-'"},
|
|
|
|
|
{u"'", u"''"},
|
|
|
|
|
{u"-'", u"'-'''"},
|
|
|
|
|
{u"-'-", u"'-''-'"},
|
|
|
|
|
{u"a-'-", u"a'-''-'"}};
|
|
|
|
|
|
|
|
|
|
for (auto &cas : cases) {
|
|
|
|
|
UnicodeString input(cas[0]);
|
|
|
|
|
UnicodeString expected(cas[1]);
|
|
|
|
|
UnicodeString result = AffixUtils::escape(UnicodeStringCharSequence(input));
|
|
|
|
|
assertEquals(input, expected, result);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void AffixUtilsTest::testUnescape() {
|
|
|
|
|
static struct TestCase {
|
|
|
|
|
const char16_t *input;
|
|
|
|
|
bool currency;
|
|
|
|
|
int32_t expectedLength;
|
|
|
|
|
const char16_t *output;
|
|
|
|
|
} cases[] = {{u"", false, 0, u""},
|
|
|
|
|
{u"abc", false, 3, u"abc"},
|
|
|
|
|
{u"-", false, 1, u"−"},
|
|
|
|
|
{u"-!", false, 2, u"−!"},
|
|
|
|
|
{u"+", false, 1, u"\u061C+"},
|
|
|
|
|
{u"+!", false, 2, u"\u061C+!"},
|
|
|
|
|
{u"‰", false, 1, u"؉"},
|
|
|
|
|
{u"‰!", false, 2, u"؉!"},
|
|
|
|
|
{u"-x", false, 2, u"−x"},
|
|
|
|
|
{u"'-'x", false, 2, u"-x"},
|
|
|
|
|
{u"'--''-'-x", false, 6, u"--'-−x"},
|
|
|
|
|
{u"''", false, 1, u"'"},
|
|
|
|
|
{u"''''", false, 2, u"''"},
|
|
|
|
|
{u"''''''", false, 3, u"'''"},
|
|
|
|
|
{u"''x''", false, 3, u"'x'"},
|
|
|
|
|
{u"¤", true, 1, u"$"},
|
|
|
|
|
{u"¤¤", true, 2, u"XXX"},
|
|
|
|
|
{u"¤¤¤", true, 3, u"long name"},
|
|
|
|
|
{u"¤¤¤¤", true, 4, u"\uFFFD"},
|
|
|
|
|
{u"¤¤¤¤¤", true, 5, u"\uFFFD"},
|
|
|
|
|
{u"¤¤¤¤¤¤", true, 6, u"\uFFFD"},
|
|
|
|
|
{u"¤¤¤a¤¤¤¤", true, 8, u"long namea\uFFFD"},
|
|
|
|
|
{u"a¤¤¤¤b¤¤¤¤¤c", true, 12, u"a\uFFFDb\uFFFDc"},
|
|
|
|
|
{u"¤!", true, 2, u"$!"},
|
|
|
|
|
{u"¤¤!", true, 3, u"XXX!"},
|
|
|
|
|
{u"¤¤¤!", true, 4, u"long name!"},
|
|
|
|
|
{u"-¤¤", true, 3, u"−XXX"},
|
|
|
|
|
{u"¤¤-", true, 3, u"XXX−"},
|
|
|
|
|
{u"'¤'", false, 1, u"¤"},
|
|
|
|
|
{u"%", false, 1, u"٪\u061C"},
|
|
|
|
|
{u"'%'", false, 1, u"%"},
|
|
|
|
|
{u"¤'-'%", true, 3, u"$-٪\u061C"},
|
|
|
|
|
{u"#0#@#*#;#", false, 9, u"#0#@#*#;#"}};
|
|
|
|
|
|
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
|
DefaultSymbolProvider defaultProvider(status);
|
|
|
|
|
assertSuccess("Constructing DefaultSymbolProvider", status);
|
|
|
|
|
|
|
|
|
|
for (TestCase cas : cases) {
|
|
|
|
|
UnicodeString input(cas.input);
|
|
|
|
|
UnicodeString output(cas.output);
|
|
|
|
|
|
|
|
|
|
assertEquals(input, cas.currency, AffixUtils::hasCurrencySymbols(UnicodeStringCharSequence(input), status));
|
|
|
|
|
assertSuccess("Spot 1", status);
|
|
|
|
|
assertEquals(input, cas.expectedLength, AffixUtils::estimateLength(UnicodeStringCharSequence(input), status));
|
|
|
|
|
assertSuccess("Spot 2", status);
|
|
|
|
|
|
|
|
|
|
UnicodeString actual = unescapeWithDefaults(defaultProvider, input, status);
|
|
|
|
|
assertSuccess("Spot 3", status);
|
|
|
|
|
assertEquals(input, output, actual);
|
|
|
|
|
|
|
|
|
|
int32_t ulength = AffixUtils::unescapedCodePointCount(UnicodeStringCharSequence(input), defaultProvider, status);
|
|
|
|
|
assertSuccess("Spot 4", status);
|
|
|
|
|
assertEquals(input, output.countChar32(), ulength);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void AffixUtilsTest::testContainsReplaceType() {
|
|
|
|
|
static struct TestCase {
|
|
|
|
|
const char16_t *input;
|
|
|
|
|
bool hasMinusSign;
|
|
|
|
|
const char16_t *output;
|
|
|
|
|
} cases[] = {{u"", false, u""},
|
|
|
|
|
{u"-", true, u"+"},
|
|
|
|
|
{u"-a", true, u"+a"},
|
|
|
|
|
{u"a-", true, u"a+"},
|
|
|
|
|
{u"a-b", true, u"a+b"},
|
|
|
|
|
{u"--", true, u"++"},
|
|
|
|
|
{u"x", false, u"x"}};
|
|
|
|
|
|
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
|
for (TestCase cas : cases) {
|
|
|
|
|
UnicodeString input(cas.input);
|
|
|
|
|
bool hasMinusSign = cas.hasMinusSign;
|
|
|
|
|
UnicodeString output(cas.output);
|
|
|
|
|
|
|
|
|
|
assertEquals(
|
|
|
|
|
input, hasMinusSign, AffixUtils::containsType(UnicodeStringCharSequence(input), TYPE_MINUS_SIGN, status));
|
|
|
|
|
assertSuccess("Spot 1", status);
|
|
|
|
|
assertEquals(
|
|
|
|
|
input, output, AffixUtils::replaceType(UnicodeStringCharSequence(input), TYPE_MINUS_SIGN, u'+', status));
|
|
|
|
|
assertSuccess("Spot 2", status);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void AffixUtilsTest::testInvalid() {
|
|
|
|
|
static const char16_t *invalidExamples[] = {
|
|
|
|
|
u"'", u"x'", u"'x", u"'x''", u"''x'"};
|
|
|
|
|
|
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
|
DefaultSymbolProvider defaultProvider(status);
|
|
|
|
|
assertSuccess("Constructing DefaultSymbolProvider", status);
|
|
|
|
|
|
|
|
|
|
for (const char16_t *strPtr : invalidExamples) {
|
|
|
|
|
UnicodeString str(strPtr);
|
|
|
|
|
|
|
|
|
|
status = U_ZERO_ERROR;
|
|
|
|
|
AffixUtils::hasCurrencySymbols(UnicodeStringCharSequence(str), status);
|
|
|
|
|
assertEquals("Should set error code spot 1", status, U_ILLEGAL_ARGUMENT_ERROR);
|
|
|
|
|
|
|
|
|
|
status = U_ZERO_ERROR;
|
|
|
|
|
AffixUtils::estimateLength(UnicodeStringCharSequence(str), status);
|
|
|
|
|
assertEquals("Should set error code spot 2", status, U_ILLEGAL_ARGUMENT_ERROR);
|
|
|
|
|
|
|
|
|
|
status = U_ZERO_ERROR;
|
|
|
|
|
unescapeWithDefaults(defaultProvider, str, status);
|
|
|
|
|
assertEquals("Should set error code spot 3", status, U_ILLEGAL_ARGUMENT_ERROR);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
class NumericSymbolProvider : public SymbolProvider {
|
|
|
|
|
public:
|
|
|
|
|
virtual UnicodeString getSymbol(AffixPatternType type) const {
|
|
|
|
|
return Int64ToUnicodeString(type < 0 ? -type : type);
|
|
|
|
|
}
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
void AffixUtilsTest::testUnescapeWithSymbolProvider() {
|
|
|
|
|
static const char16_t* cases[][2] = {
|
|
|
|
|
{u"", u""},
|
|
|
|
|
{u"-", u"1"},
|
|
|
|
|
{u"'-'", u"-"},
|
|
|
|
|
{u"- + % ‰ ¤ ¤¤ ¤¤¤ ¤¤¤¤ ¤¤¤¤¤", u"1 2 3 4 5 6 7 8 9"},
|
|
|
|
|
{u"'¤¤¤¤¤¤'", u"¤¤¤¤¤¤"},
|
|
|
|
|
{u"¤¤¤¤¤¤", u"\uFFFD"}
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
NumericSymbolProvider provider;
|
|
|
|
|
|
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
|
NumberStringBuilder sb;
|
|
|
|
|
for (auto cas : cases) {
|
|
|
|
|
UnicodeString input(cas[0]);
|
|
|
|
|
UnicodeString expected(cas[1]);
|
|
|
|
|
sb.clear();
|
|
|
|
|
AffixUtils::unescape(UnicodeStringCharSequence(input), sb, 0, provider, status);
|
|
|
|
|
assertSuccess("Spot 1", status);
|
|
|
|
|
assertEquals(input, expected, sb.toUnicodeString());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Test insertion position
|
|
|
|
|
sb.clear();
|
|
|
|
|
sb.append(u"abcdefg", UNUM_FIELD_COUNT, status);
|
|
|
|
|
assertSuccess("Spot 2", status);
|
|
|
|
|
AffixUtils::unescape(UnicodeStringCharSequence(UnicodeString(u"-+%")), sb, 4, provider, status);
|
|
|
|
|
assertSuccess("Spot 3", status);
|
|
|
|
|
assertEquals(u"Symbol provider into middle", u"abcd123efg", sb.toUnicodeString());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
UnicodeString AffixUtilsTest::unescapeWithDefaults(const SymbolProvider &defaultProvider,
|
|
|
|
|
UnicodeString input, UErrorCode &status) {
|
|
|
|
|
NumberStringBuilder nsb;
|
|
|
|
|
int32_t length = AffixUtils::unescape(UnicodeStringCharSequence(input), nsb, 0, defaultProvider, status);
|
|
|
|
|
assertEquals("Return value of unescape", nsb.length(), length);
|
|
|
|
|
return nsb.toUnicodeString();
|
|
|
|
|
}
|
2017-09-27 05:31:57 +00:00
|
|
|
|
|
|
|
|
|
#endif /* #if !UCONFIG_NO_FORMATTING */
|