2017-01-20 00:20:31 +00:00
|
|
|
// © 2016 and later: Unicode, Inc. and others.
|
2016-06-15 18:58:17 +00:00
|
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
2009-03-09 23:40:15 +00:00
|
|
|
/********************************************************************
|
2016-02-24 21:48:56 +00:00
|
|
|
* COPYRIGHT:
|
2016-05-31 21:45:07 +00:00
|
|
|
* Copyright (c) 2009-2016, International Business Machines Corporation and
|
|
|
|
* others. All Rights Reserved.
|
2009-03-09 23:40:15 +00:00
|
|
|
********************************************************************/
|
|
|
|
/********************************************************************************
|
|
|
|
*
|
|
|
|
* File spooftest.c
|
|
|
|
*
|
|
|
|
*********************************************************************************/
|
|
|
|
/*C API TEST for the uspoof Unicode Indentifier Spoofing and Security API */
|
|
|
|
/**
|
|
|
|
* This is an API test for ICU spoof detection in plain C. It doesn't test very many cases, and doesn't
|
|
|
|
* try to test the full functionality. It just calls each function and verifies that it
|
|
|
|
* works on a basic level.
|
|
|
|
*
|
|
|
|
* More complete testing of spoof detection functionality is done with the C++ tests.
|
|
|
|
**/
|
|
|
|
|
|
|
|
#include "unicode/utypes.h"
|
2009-08-04 21:09:17 +00:00
|
|
|
#if !UCONFIG_NO_REGULAR_EXPRESSIONS && !UCONFIG_NO_NORMALIZATION
|
2009-03-09 23:40:15 +00:00
|
|
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include "unicode/uspoof.h"
|
|
|
|
#include "unicode/ustring.h"
|
2009-03-28 00:28:35 +00:00
|
|
|
#include "unicode/uset.h"
|
2009-03-09 23:40:15 +00:00
|
|
|
#include "cintltst.h"
|
2016-02-24 21:48:56 +00:00
|
|
|
#include "cmemory.h"
|
2009-03-09 23:40:15 +00:00
|
|
|
|
|
|
|
#define TEST_ASSERT_SUCCESS(status) {if (U_FAILURE(status)) { \
|
2009-06-09 21:28:13 +00:00
|
|
|
log_err_status(status, "Failure at file %s, line %d, error = %s\n", __FILE__, __LINE__, u_errorName(status));}}
|
2009-03-09 23:40:15 +00:00
|
|
|
|
2009-03-28 00:28:35 +00:00
|
|
|
#define TEST_ASSERT(expr) {if ((expr)==FALSE) { \
|
|
|
|
log_err("Test Failure at file %s, line %d: \"%s\" is false.\n", __FILE__, __LINE__, #expr);};}
|
2009-03-09 23:40:15 +00:00
|
|
|
|
|
|
|
#define TEST_ASSERT_EQ(a, b) { if ((a) != (b)) { \
|
|
|
|
log_err("Test Failure at file %s, line %d: \"%s\" (%d) != \"%s\" (%d) \n", \
|
|
|
|
__FILE__, __LINE__, #a, (a), #b, (b)); }}
|
|
|
|
|
|
|
|
#define TEST_ASSERT_NE(a, b) { if ((a) == (b)) { \
|
|
|
|
log_err("Test Failure at file %s, line %d: \"%s\" (%d) == \"%s\" (%d) \n", \
|
|
|
|
__FILE__, __LINE__, #a, (a), #b, (b)); }}
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
* TEST_SETUP and TEST_TEARDOWN
|
|
|
|
* macros to handle the boilerplate around setting up test case.
|
|
|
|
* Put arbitrary test code between SETUP and TEARDOWN.
|
|
|
|
* "sc" is the ready-to-go SpoofChecker for use in the tests.
|
|
|
|
*/
|
|
|
|
#define TEST_SETUP { \
|
|
|
|
UErrorCode status = U_ZERO_ERROR; \
|
|
|
|
USpoofChecker *sc; \
|
|
|
|
sc = uspoof_open(&status); \
|
2009-03-28 00:28:35 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status); \
|
|
|
|
if (U_SUCCESS(status)){
|
2009-03-09 23:40:15 +00:00
|
|
|
|
|
|
|
#define TEST_TEARDOWN \
|
|
|
|
} \
|
|
|
|
TEST_ASSERT_SUCCESS(status); \
|
|
|
|
uspoof_close(sc); \
|
|
|
|
}
|
|
|
|
|
2015-09-07 01:18:49 +00:00
|
|
|
static void TestOpenFromSource(void);
|
2009-03-09 23:40:15 +00:00
|
|
|
static void TestUSpoofCAPI(void);
|
|
|
|
|
|
|
|
void addUSpoofTest(TestNode** root);
|
|
|
|
|
|
|
|
void addUSpoofTest(TestNode** root)
|
|
|
|
{
|
2009-08-04 21:09:17 +00:00
|
|
|
#if !UCONFIG_NO_FILE_IO
|
2015-09-07 01:18:49 +00:00
|
|
|
addTest(root, &TestOpenFromSource, "uspoof/TestOpenFromSource");
|
2009-08-04 21:09:17 +00:00
|
|
|
#endif
|
2015-09-07 01:18:49 +00:00
|
|
|
addTest(root, &TestUSpoofCAPI, "uspoof/TestUSpoofCAPI");
|
2009-03-09 23:40:15 +00:00
|
|
|
}
|
|
|
|
|
2009-03-28 00:28:35 +00:00
|
|
|
/*
|
2009-04-01 01:09:49 +00:00
|
|
|
* Identifiers for verifying that spoof checking is minimally alive and working.
|
2009-03-28 00:28:35 +00:00
|
|
|
*/
|
2010-10-15 00:01:43 +00:00
|
|
|
const UChar goodLatin[] = {(UChar)0x75, (UChar)0x7a, 0}; /* "uz", all ASCII */
|
2009-04-01 01:09:49 +00:00
|
|
|
/* (not confusable) */
|
|
|
|
const UChar scMixed[] = {(UChar)0x73, (UChar)0x0441, 0}; /* "sc", with Cyrillic 'c' */
|
|
|
|
/* (mixed script, confusable */
|
2009-03-30 23:05:55 +00:00
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
const UChar scLatin[] = {(UChar)0x73, (UChar)0x63, 0}; /* "sc", plain ascii. */
|
2009-03-30 23:05:55 +00:00
|
|
|
const UChar goodCyrl[] = {(UChar)0x438, (UChar)0x43B, 0}; /* Plain lower case Cyrillic letters,
|
2009-04-01 01:09:49 +00:00
|
|
|
no latin confusables */
|
2009-03-28 00:28:35 +00:00
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
const UChar goodGreek[] = {(UChar)0x3c0, (UChar)0x3c6, 0}; /* Plain lower case Greek letters */
|
2009-03-30 23:05:55 +00:00
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
const UChar lll_Latin_a[] = {(UChar)0x6c, (UChar)0x49, (UChar)0x31, 0}; /* lI1, all ASCII */
|
|
|
|
|
|
|
|
/* Full-width I, Small Roman Numeral fifty, Latin Cap Letter IOTA*/
|
|
|
|
const UChar lll_Latin_b[] = {(UChar)0xff29, (UChar)0x217c, (UChar)0x196, 0};
|
|
|
|
|
|
|
|
const UChar lll_Cyrl[] = {(UChar)0x0406, (UChar)0x04C0, (UChar)0x31, 0};
|
|
|
|
|
2010-10-15 00:01:43 +00:00
|
|
|
/* The skeleton transform for all of thes 'lll' lookalikes is all lower case l. */
|
|
|
|
const UChar lll_Skel[] = {(UChar)0x6c, (UChar)0x6c, (UChar)0x6c, 0};
|
2009-03-09 23:40:15 +00:00
|
|
|
|
2011-02-23 23:05:20 +00:00
|
|
|
const UChar han_Hiragana[] = {(UChar)0x3086, (UChar)0x308A, (UChar)0x0020, (UChar)0x77F3, (UChar)0x7530, 0};
|
|
|
|
|
2009-09-18 06:38:49 +00:00
|
|
|
/* Provide better code coverage */
|
|
|
|
const char goodLatinUTF8[] = {0x75, 0x77, 0};
|
2009-03-09 23:40:15 +00:00
|
|
|
|
2015-09-07 01:18:49 +00:00
|
|
|
// Test open from source rules.
|
|
|
|
// Run this in isolation to verify initialization.
|
|
|
|
static void TestOpenFromSource() {
|
|
|
|
// No TEST_SETUP because that calls uspoof_open().
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
2009-03-09 23:40:15 +00:00
|
|
|
const char *dataSrcDir;
|
|
|
|
char *fileName;
|
|
|
|
char *confusables;
|
2013-03-21 01:42:01 +00:00
|
|
|
int confusablesLength = 0;
|
2009-03-09 23:40:15 +00:00
|
|
|
char *confusablesWholeScript;
|
2013-03-21 01:42:01 +00:00
|
|
|
int confusablesWholeScriptLength = 0;
|
2009-03-09 23:40:15 +00:00
|
|
|
FILE *f;
|
|
|
|
UParseError pe;
|
|
|
|
int32_t errType;
|
2015-09-07 01:18:49 +00:00
|
|
|
int32_t checkResults;
|
2009-03-09 23:40:15 +00:00
|
|
|
USpoofChecker *rsc;
|
2015-09-07 01:18:49 +00:00
|
|
|
|
2009-03-09 23:40:15 +00:00
|
|
|
dataSrcDir = ctest_dataSrcDir();
|
|
|
|
fileName = malloc(strlen(dataSrcDir) + 100);
|
|
|
|
strcpy(fileName, dataSrcDir);
|
|
|
|
strcat(fileName, U_FILE_SEP_STRING "unidata" U_FILE_SEP_STRING "confusables.txt");
|
2011-09-15 19:34:17 +00:00
|
|
|
f = fopen(fileName, "rb");
|
2009-03-09 23:40:15 +00:00
|
|
|
TEST_ASSERT_NE(f, NULL);
|
|
|
|
confusables = malloc(3000000);
|
2012-09-11 00:22:56 +00:00
|
|
|
if (f != NULL) {
|
2013-03-21 01:42:01 +00:00
|
|
|
confusablesLength = fread(confusables, 1, 3000000, f);
|
|
|
|
fclose(f);
|
2012-09-11 00:22:56 +00:00
|
|
|
}
|
2009-03-09 23:40:15 +00:00
|
|
|
|
|
|
|
strcpy(fileName, dataSrcDir);
|
|
|
|
strcat(fileName, U_FILE_SEP_STRING "unidata" U_FILE_SEP_STRING "confusablesWholeScript.txt");
|
2011-09-15 19:34:17 +00:00
|
|
|
f = fopen(fileName, "rb");
|
2009-03-09 23:40:15 +00:00
|
|
|
TEST_ASSERT_NE(f, NULL);
|
|
|
|
confusablesWholeScript = malloc(1000000);
|
2012-09-11 00:22:56 +00:00
|
|
|
if (f != NULL) {
|
2013-03-21 01:42:01 +00:00
|
|
|
confusablesWholeScriptLength = fread(confusablesWholeScript, 1, 1000000, f);
|
|
|
|
fclose(f);
|
2012-09-11 00:22:56 +00:00
|
|
|
}
|
2009-03-09 23:40:15 +00:00
|
|
|
|
|
|
|
rsc = uspoof_openFromSource(confusables, confusablesLength,
|
2015-09-07 01:18:49 +00:00
|
|
|
confusablesWholeScript, confusablesWholeScriptLength,
|
|
|
|
&errType, &pe, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
|
|
|
|
// Ticket #11860: uspoof_openFromSource() did not initialize for use.
|
|
|
|
// Verify that the spoof checker does not crash.
|
|
|
|
checkResults = uspoof_check(rsc, goodLatin, -1, NULL, &status);
|
2009-03-09 23:40:15 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2015-09-07 01:18:49 +00:00
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
2009-03-09 23:40:15 +00:00
|
|
|
|
|
|
|
free(confusablesWholeScript);
|
|
|
|
free(confusables);
|
|
|
|
free(fileName);
|
|
|
|
uspoof_close(rsc);
|
|
|
|
/* printf("ParseError Line is %d\n", pe.line); */
|
2015-09-07 01:18:49 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Spoof Detection C API Tests
|
|
|
|
*/
|
|
|
|
static void TestUSpoofCAPI(void) {
|
2009-03-28 00:28:35 +00:00
|
|
|
|
2015-09-07 01:18:49 +00:00
|
|
|
/*
|
|
|
|
* basic uspoof_open().
|
|
|
|
*/
|
|
|
|
{
|
|
|
|
USpoofChecker *sc;
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
sc = uspoof_open(&status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
if (U_FAILURE(status)) {
|
|
|
|
/* If things are so broken that we can't even open a default spoof checker, */
|
|
|
|
/* don't even try the rest of the tests. They would all fail. */
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
uspoof_close(sc);
|
|
|
|
}
|
2009-03-28 00:28:35 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* openFromSerialized and serialize
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
int32_t serializedSize = 0;
|
|
|
|
int32_t actualLength = 0;
|
|
|
|
char *buf;
|
|
|
|
USpoofChecker *sc2;
|
|
|
|
int32_t checkResults;
|
|
|
|
|
|
|
|
|
|
|
|
serializedSize = uspoof_serialize(sc, NULL, 0, &status);
|
|
|
|
TEST_ASSERT_EQ(status, U_BUFFER_OVERFLOW_ERROR);
|
|
|
|
TEST_ASSERT(serializedSize > 0);
|
|
|
|
|
|
|
|
/* Serialize the default spoof checker */
|
|
|
|
status = U_ZERO_ERROR;
|
|
|
|
buf = (char *)malloc(serializedSize + 10);
|
|
|
|
TEST_ASSERT(buf != NULL);
|
|
|
|
buf[serializedSize] = 42;
|
|
|
|
uspoof_serialize(sc, buf, serializedSize, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(42, buf[serializedSize]);
|
|
|
|
|
|
|
|
/* Create a new spoof checker from the freshly serialized data */
|
|
|
|
sc2 = uspoof_openFromSerialized(buf, serializedSize+10, &actualLength, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_NE(NULL, sc2);
|
|
|
|
TEST_ASSERT_EQ(serializedSize, actualLength);
|
|
|
|
|
|
|
|
/* Verify that the new spoof checker at least wiggles */
|
2009-03-30 23:05:55 +00:00
|
|
|
checkResults = uspoof_check(sc2, goodLatin, -1, NULL, &status);
|
2009-03-28 00:28:35 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
checkResults = uspoof_check(sc2, scMixed, -1, NULL, &status);
|
2009-03-28 00:28:35 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2016-09-13 22:15:13 +00:00
|
|
|
TEST_ASSERT_EQ(USPOOF_SINGLE_SCRIPT, checkResults);
|
2009-03-28 00:28:35 +00:00
|
|
|
|
|
|
|
uspoof_close(sc2);
|
|
|
|
free(buf);
|
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Set & Get Check Flags
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
int32_t t;
|
|
|
|
uspoof_setChecks(sc, USPOOF_ALL_CHECKS, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
t = uspoof_getChecks(sc, &status);
|
|
|
|
TEST_ASSERT_EQ(t, USPOOF_ALL_CHECKS);
|
2009-03-09 23:40:15 +00:00
|
|
|
|
2009-03-28 00:28:35 +00:00
|
|
|
uspoof_setChecks(sc, 0, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
t = uspoof_getChecks(sc, &status);
|
|
|
|
TEST_ASSERT_EQ(0, t);
|
|
|
|
|
|
|
|
uspoof_setChecks(sc,
|
|
|
|
USPOOF_WHOLE_SCRIPT_CONFUSABLE | USPOOF_MIXED_SCRIPT_CONFUSABLE | USPOOF_ANY_CASE,
|
|
|
|
&status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
t = uspoof_getChecks(sc, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(USPOOF_WHOLE_SCRIPT_CONFUSABLE | USPOOF_MIXED_SCRIPT_CONFUSABLE | USPOOF_ANY_CASE, t);
|
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* get & setAllowedChars
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
USet *us;
|
|
|
|
const USet *uset;
|
|
|
|
|
|
|
|
uset = uspoof_getAllowedChars(sc, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT(uset_isFrozen(uset));
|
|
|
|
us = uset_open((UChar32)0x41, (UChar32)0x5A); /* [A-Z] */
|
|
|
|
uspoof_setAllowedChars(sc, us, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_NE(us, uspoof_getAllowedChars(sc, &status));
|
|
|
|
TEST_ASSERT(uset_equals(us, uspoof_getAllowedChars(sc, &status)));
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
uset_close(us);
|
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* clone()
|
|
|
|
*/
|
|
|
|
|
|
|
|
TEST_SETUP
|
|
|
|
USpoofChecker *clone1 = NULL;
|
|
|
|
USpoofChecker *clone2 = NULL;
|
|
|
|
int32_t checkResults = 0;
|
|
|
|
|
|
|
|
clone1 = uspoof_clone(sc, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_NE(clone1, sc);
|
|
|
|
|
|
|
|
clone2 = uspoof_clone(clone1, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_NE(clone2, clone1);
|
|
|
|
|
|
|
|
uspoof_close(clone1);
|
|
|
|
|
|
|
|
/* Verify that the cloned spoof checker is alive */
|
2009-03-30 23:05:55 +00:00
|
|
|
checkResults = uspoof_check(clone2, goodLatin, -1, NULL, &status);
|
2009-03-28 00:28:35 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
checkResults = uspoof_check(clone2, scMixed, -1, NULL, &status);
|
2009-03-28 00:28:35 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2016-09-13 22:15:13 +00:00
|
|
|
TEST_ASSERT_EQ(USPOOF_SINGLE_SCRIPT, checkResults);
|
2009-03-30 23:05:55 +00:00
|
|
|
uspoof_close(clone2);
|
2009-03-28 00:28:35 +00:00
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
2011-02-23 23:05:20 +00:00
|
|
|
/*
|
|
|
|
* basic uspoof_check()
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
int32_t result;
|
|
|
|
result = uspoof_check(sc, goodLatin, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, result);
|
|
|
|
|
|
|
|
result = uspoof_check(sc, han_Hiragana, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, result);
|
|
|
|
|
|
|
|
result = uspoof_check(sc, scMixed, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2016-09-13 22:15:13 +00:00
|
|
|
TEST_ASSERT_EQ(USPOOF_SINGLE_SCRIPT, result);
|
2011-02-23 23:05:20 +00:00
|
|
|
TEST_TEARDOWN
|
|
|
|
|
|
|
|
|
2009-03-28 00:28:35 +00:00
|
|
|
/*
|
|
|
|
* get & set Checks
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
int32_t checks;
|
|
|
|
int32_t checks2;
|
|
|
|
int32_t checkResults;
|
|
|
|
|
|
|
|
checks = uspoof_getChecks(sc, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(USPOOF_ALL_CHECKS, checks);
|
|
|
|
|
2009-03-30 05:08:00 +00:00
|
|
|
checks &= ~(USPOOF_SINGLE_SCRIPT | USPOOF_MIXED_SCRIPT_CONFUSABLE);
|
2009-03-28 00:28:35 +00:00
|
|
|
uspoof_setChecks(sc, checks, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
checks2 = uspoof_getChecks(sc, &status);
|
|
|
|
TEST_ASSERT_EQ(checks, checks2);
|
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
/* The checks that were disabled just above are the same ones that the "scMixed" test fails.
|
2009-03-28 00:28:35 +00:00
|
|
|
So with those tests gone checking that Identifier should now succeed */
|
2009-04-01 01:09:49 +00:00
|
|
|
checkResults = uspoof_check(sc, scMixed, -1, NULL, &status);
|
2009-03-28 00:28:35 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2009-03-30 05:08:00 +00:00
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
2009-03-28 00:28:35 +00:00
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
2009-03-30 23:05:55 +00:00
|
|
|
/*
|
|
|
|
* AllowedLoacles
|
|
|
|
*/
|
|
|
|
|
|
|
|
TEST_SETUP
|
|
|
|
const char *allowedLocales;
|
|
|
|
int32_t checkResults;
|
|
|
|
|
|
|
|
/* Default allowed locales list should be empty */
|
|
|
|
allowedLocales = uspoof_getAllowedLocales(sc, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT(strcmp("", allowedLocales) == 0)
|
|
|
|
|
|
|
|
/* Allow en and ru, which should enable Latin and Cyrillic only to pass */
|
|
|
|
uspoof_setAllowedLocales(sc, "en, ru_RU", &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
allowedLocales = uspoof_getAllowedLocales(sc, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT(strstr(allowedLocales, "en") != NULL);
|
|
|
|
TEST_ASSERT(strstr(allowedLocales, "ru") != NULL);
|
|
|
|
|
|
|
|
/* Limit checks to USPOOF_CHAR_LIMIT. Some of the test data has whole script confusables also,
|
|
|
|
* which we don't want to see in this test. */
|
|
|
|
uspoof_setChecks(sc, USPOOF_CHAR_LIMIT, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
|
|
|
|
checkResults = uspoof_check(sc, goodLatin, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
|
|
|
|
|
|
|
checkResults = uspoof_check(sc, goodGreek, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(USPOOF_CHAR_LIMIT, checkResults);
|
|
|
|
|
|
|
|
checkResults = uspoof_check(sc, goodCyrl, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
|
|
|
|
|
|
|
/* Reset with an empty locale list, which should allow all characters to pass */
|
|
|
|
uspoof_setAllowedLocales(sc, " ", &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
|
|
|
|
checkResults = uspoof_check(sc, goodGreek, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
|
|
|
TEST_TEARDOWN;
|
2009-03-31 00:34:17 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* AllowedChars set/get the USet of allowed characters.
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
const USet *set;
|
|
|
|
USet *tmpSet;
|
|
|
|
int32_t checkResults;
|
|
|
|
|
|
|
|
/* By default, we should see no restriction; the USet should allow all characters. */
|
|
|
|
set = uspoof_getAllowedChars(sc, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
tmpSet = uset_open(0, 0x10ffff);
|
|
|
|
TEST_ASSERT(uset_equals(tmpSet, set));
|
|
|
|
|
|
|
|
/* Setting the allowed chars should enable the check. */
|
|
|
|
uspoof_setChecks(sc, USPOOF_ALL_CHECKS & ~USPOOF_CHAR_LIMIT, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
|
|
|
|
/* Remove a character that is in our good Latin test identifier from the allowed chars set. */
|
|
|
|
uset_remove(tmpSet, goodLatin[1]);
|
|
|
|
uspoof_setAllowedChars(sc, tmpSet, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
uset_close(tmpSet);
|
|
|
|
|
2013-02-11 04:51:14 +00:00
|
|
|
/* Latin Identifier should now fail; other non-latin test cases should still be OK
|
|
|
|
* Note: fail of CHAR_LIMIT also causes the restriction level to be USPOOF_UNRESTRICTIVE
|
|
|
|
* which will give us a USPOOF_RESTRICTION_LEVEL failure.
|
|
|
|
*/
|
2009-03-31 00:34:17 +00:00
|
|
|
checkResults = uspoof_check(sc, goodLatin, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2013-02-11 04:51:14 +00:00
|
|
|
TEST_ASSERT_EQ(USPOOF_CHAR_LIMIT | USPOOF_RESTRICTION_LEVEL, checkResults);
|
2009-03-31 00:34:17 +00:00
|
|
|
|
|
|
|
checkResults = uspoof_check(sc, goodGreek, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2016-09-13 22:15:13 +00:00
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
2009-03-31 00:34:17 +00:00
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
/*
|
|
|
|
* check UTF-8
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
char utf8buf[200];
|
2016-09-13 22:15:13 +00:00
|
|
|
int32_t checkResults, checkResults2;
|
2009-04-01 01:09:49 +00:00
|
|
|
int32_t position;
|
|
|
|
|
|
|
|
u_strToUTF8(utf8buf, sizeof(utf8buf), NULL, goodLatin, -1, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
position = 666;
|
|
|
|
checkResults = uspoof_checkUTF8(sc, utf8buf, -1, &position, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
2013-02-11 04:51:14 +00:00
|
|
|
TEST_ASSERT_EQ(0, position);
|
2009-04-01 01:09:49 +00:00
|
|
|
|
|
|
|
u_strToUTF8(utf8buf, sizeof(utf8buf), NULL, goodCyrl, -1, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
checkResults = uspoof_checkUTF8(sc, utf8buf, -1, &position, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
2009-03-09 23:40:15 +00:00
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
u_strToUTF8(utf8buf, sizeof(utf8buf), NULL, scMixed, -1, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
position = 666;
|
|
|
|
checkResults = uspoof_checkUTF8(sc, utf8buf, -1, &position, &status);
|
2016-09-13 22:15:13 +00:00
|
|
|
checkResults2 = uspoof_check(sc, scMixed, -1, NULL, &status);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2016-09-13 22:15:13 +00:00
|
|
|
TEST_ASSERT_EQ(USPOOF_SINGLE_SCRIPT , checkResults);
|
2013-02-11 04:51:14 +00:00
|
|
|
TEST_ASSERT_EQ(0, position);
|
2016-09-13 22:15:13 +00:00
|
|
|
TEST_ASSERT_EQ(checkResults , checkResults2);
|
|
|
|
|
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* uspoof_check2 variants
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
int32_t result1, result2;
|
|
|
|
char utf8buf[200];
|
|
|
|
uspoof_setChecks(sc, USPOOF_ALL_CHECKS | USPOOF_AUX_INFO, &status);
|
|
|
|
USpoofCheckResult* checkResult = uspoof_openCheckResult(&status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
|
|
|
|
const UChar* tests[] = { goodLatin, scMixed, scLatin,
|
|
|
|
goodCyrl, goodGreek, lll_Latin_a, lll_Latin_b, han_Hiragana };
|
|
|
|
|
2016-09-20 21:06:55 +00:00
|
|
|
for (int32_t i=0; i<UPRV_LENGTHOF(tests); i++) {
|
2016-09-13 22:15:13 +00:00
|
|
|
const UChar* str = tests[i];
|
|
|
|
|
|
|
|
// Basic test
|
|
|
|
result1 = uspoof_check(sc, str, -1, NULL, &status);
|
|
|
|
result2 = uspoof_check2(sc, str, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(result1, result2);
|
|
|
|
|
|
|
|
// With check result parameter
|
|
|
|
result1 = uspoof_check(sc, str, -1, NULL, &status);
|
|
|
|
result2 = uspoof_check2(sc, str, -1, checkResult, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(result1, result2);
|
|
|
|
|
|
|
|
// Checks from checkResult should be same as those from bitmask
|
|
|
|
TEST_ASSERT_EQ(result1 & USPOOF_ALL_CHECKS, uspoof_getCheckResultChecks(checkResult, &status));
|
|
|
|
|
|
|
|
// Restriction level from checkResult should be same as that from bitmask
|
|
|
|
URestrictionLevel restrictionLevel = uspoof_getCheckResultRestrictionLevel(checkResult, &status);
|
|
|
|
TEST_ASSERT_EQ(result1 & restrictionLevel, restrictionLevel);
|
|
|
|
|
|
|
|
// UTF8 endpoint
|
|
|
|
u_strToUTF8(utf8buf, sizeof(utf8buf), NULL, goodLatin, -1, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
result1 = uspoof_checkUTF8(sc, utf8buf, -1, NULL, &status);
|
|
|
|
result2 = uspoof_check2UTF8(sc, utf8buf, -1, NULL, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(result1, result2);
|
|
|
|
}
|
2009-04-01 01:09:49 +00:00
|
|
|
|
2016-09-13 22:15:13 +00:00
|
|
|
uspoof_closeCheckResult(checkResult);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_TEARDOWN;
|
2009-03-28 00:28:35 +00:00
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
/*
|
|
|
|
* uspoof_areConfusable()
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
int32_t checkResults;
|
|
|
|
|
2009-04-02 06:08:36 +00:00
|
|
|
checkResults = uspoof_areConfusable(sc, scLatin, -1, scMixed, -1, &status);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(USPOOF_MIXED_SCRIPT_CONFUSABLE, checkResults);
|
|
|
|
|
2009-04-02 06:08:36 +00:00
|
|
|
checkResults = uspoof_areConfusable(sc, goodGreek, -1, scLatin, -1, &status);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
|
|
|
|
2009-04-02 06:08:36 +00:00
|
|
|
checkResults = uspoof_areConfusable(sc, lll_Latin_a, -1, lll_Latin_b, -1, &status);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2009-04-22 02:07:40 +00:00
|
|
|
TEST_ASSERT_EQ(USPOOF_SINGLE_SCRIPT_CONFUSABLE, checkResults);
|
2009-03-28 00:28:35 +00:00
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* areConfusableUTF8
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
|
|
|
int32_t checkResults;
|
|
|
|
char s1[200];
|
|
|
|
char s2[200];
|
|
|
|
|
|
|
|
|
|
|
|
u_strToUTF8(s1, sizeof(s1), NULL, scLatin, -1, &status);
|
|
|
|
u_strToUTF8(s2, sizeof(s2), NULL, scMixed, -1, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2009-04-02 06:08:36 +00:00
|
|
|
checkResults = uspoof_areConfusableUTF8(sc, s1, -1, s2, -1, &status);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(USPOOF_MIXED_SCRIPT_CONFUSABLE, checkResults);
|
|
|
|
|
|
|
|
u_strToUTF8(s1, sizeof(s1), NULL, goodGreek, -1, &status);
|
|
|
|
u_strToUTF8(s2, sizeof(s2), NULL, scLatin, -1, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2009-04-02 06:08:36 +00:00
|
|
|
checkResults = uspoof_areConfusableUTF8(sc, s1, -1, s2, -1, &status);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, checkResults);
|
|
|
|
|
|
|
|
u_strToUTF8(s1, sizeof(s1), NULL, lll_Latin_a, -1, &status);
|
|
|
|
u_strToUTF8(s2, sizeof(s2), NULL, lll_Latin_b, -1, &status);
|
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2009-04-02 06:08:36 +00:00
|
|
|
checkResults = uspoof_areConfusableUTF8(sc, s1, -1, s2, -1, &status);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
2009-04-22 02:07:40 +00:00
|
|
|
TEST_ASSERT_EQ(USPOOF_SINGLE_SCRIPT_CONFUSABLE, checkResults);
|
2009-04-01 01:09:49 +00:00
|
|
|
|
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
* getSkeleton
|
|
|
|
*/
|
|
|
|
|
|
|
|
TEST_SETUP
|
|
|
|
UChar dest[100];
|
|
|
|
int32_t skelLength;
|
|
|
|
|
2016-02-24 21:48:56 +00:00
|
|
|
skelLength = uspoof_getSkeleton(sc, USPOOF_ANY_CASE, lll_Latin_a, -1, dest, UPRV_LENGTHOF(dest), &status);
|
2009-04-01 01:09:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(0, u_strcmp(lll_Skel, dest));
|
|
|
|
TEST_ASSERT_EQ(u_strlen(lll_Skel), skelLength);
|
|
|
|
|
2010-05-05 15:19:40 +00:00
|
|
|
skelLength = uspoof_getSkeletonUTF8(sc, USPOOF_ANY_CASE, goodLatinUTF8, -1, (char*)dest,
|
2016-02-24 21:48:56 +00:00
|
|
|
UPRV_LENGTHOF(dest), &status);
|
2009-09-18 06:38:49 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
skelLength = uspoof_getSkeleton(sc, USPOOF_ANY_CASE, lll_Latin_a, -1, NULL, 0, &status);
|
|
|
|
TEST_ASSERT_EQ(U_BUFFER_OVERFLOW_ERROR, status);
|
|
|
|
TEST_ASSERT_EQ(3, skelLength);
|
|
|
|
status = U_ZERO_ERROR;
|
|
|
|
|
|
|
|
TEST_TEARDOWN;
|
2014-12-08 19:56:43 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* get Inclusion and Recommended sets
|
|
|
|
*/
|
|
|
|
TEST_SETUP
|
2014-12-08 22:40:31 +00:00
|
|
|
const USet *inclusions = NULL;
|
|
|
|
const USet *recommended = NULL;
|
|
|
|
|
|
|
|
inclusions = uspoof_getInclusionSet(&status);
|
2014-12-08 19:56:43 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(TRUE, uset_isFrozen(inclusions));
|
|
|
|
|
|
|
|
status = U_ZERO_ERROR;
|
2014-12-08 22:40:31 +00:00
|
|
|
recommended = uspoof_getRecommendedSet(&status);
|
2014-12-08 19:56:43 +00:00
|
|
|
TEST_ASSERT_SUCCESS(status);
|
|
|
|
TEST_ASSERT_EQ(TRUE, uset_isFrozen(recommended));
|
|
|
|
TEST_TEARDOWN;
|
|
|
|
|
2009-04-01 01:09:49 +00:00
|
|
|
}
|
2009-03-28 00:28:35 +00:00
|
|
|
|
2009-05-04 05:45:27 +00:00
|
|
|
#endif /* UCONFIG_NO_REGULAR_EXPRESSIONS */
|