forked from AuroraMiddleware/gtk
359 lines
8.8 KiB
C
359 lines
8.8 KiB
C
/* Copyright (C) 1991, 1992, 1993 Free Software Foundation, Inc.
|
||
*
|
||
* This library is free software; you can redistribute it and/or
|
||
* modify it under the terms of the GNU Lesser General Public
|
||
* License as published by the Free Software Foundation; either
|
||
* version 2 of the License, or (at your option) any later version.
|
||
*
|
||
* This library is distributed in the hope that it will be useful,
|
||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||
* Lesser General Public License for more details.
|
||
*
|
||
* You should have received a copy of the GNU Lesser General Public
|
||
* License along with this library. If not, see <http://www.gnu.org/licenses/>.
|
||
*/
|
||
|
||
/*
|
||
* Modified by the GTK+ Team and others 1997-2000. See the AUTHORS
|
||
* file for a list of people on the GTK+ Team. See the ChangeLog
|
||
* files for a list of changes. These files are distributed with
|
||
* GTK+ at ftp://ftp.gtk.org/pub/gtk/.
|
||
*/
|
||
|
||
/*
|
||
* Stripped down, converted to UTF-8 and test cases added
|
||
*
|
||
* Owen Taylor, 13 December 2002;
|
||
*/
|
||
|
||
#include "config.h"
|
||
|
||
#include "gtkprivate.h"
|
||
|
||
#include <string.h>
|
||
|
||
#include <glib.h>
|
||
|
||
static gunichar
|
||
get_char (const char **str)
|
||
{
|
||
gunichar c = g_utf8_get_char (*str);
|
||
*str = g_utf8_next_char (*str);
|
||
|
||
#ifdef G_PLATFORM_WIN32
|
||
c = g_unichar_tolower (c);
|
||
#endif
|
||
|
||
return c;
|
||
}
|
||
|
||
/* DO_ESCAPE is always defined, to either 0 or 1, so it can be used in
 * ordinary C expressions as well as in #if tests:
 *   1 - a backslash in a pattern escapes the following character;
 *   0 - a backslash is an ordinary character (Windows and Cygwin builds).
 */
#if !defined(G_OS_WIN32) && !defined(G_WITH_CYGWIN)
#define DO_ESCAPE 1
#else
#define DO_ESCAPE 0
#endif
|
||
|
||
static gunichar
|
||
get_unescaped_char (const char **str,
|
||
gboolean *was_escaped)
|
||
{
|
||
gunichar c = get_char (str);
|
||
|
||
*was_escaped = DO_ESCAPE && c == '\\';
|
||
if (*was_escaped)
|
||
c = get_char (str);
|
||
|
||
return c;
|
||
}
|
||
|
||
/* Match STRING against the filename pattern PATTERN, returning zero if
|
||
it matches, nonzero if not. */
|
||
|
||
static gboolean
|
||
gtk_fnmatch_intern (const char *pattern,
|
||
const char *string,
|
||
gboolean component_start,
|
||
gboolean no_leading_period)
|
||
{
|
||
const char *p = pattern, *n = string;
|
||
|
||
while (*p)
|
||
{
|
||
const char *last_n = n;
|
||
|
||
gunichar c = get_char (&p);
|
||
gunichar nc = get_char (&n);
|
||
|
||
switch (c)
|
||
{
|
||
case '?':
|
||
if (nc == '\0')
|
||
return FALSE;
|
||
else if (nc == G_DIR_SEPARATOR)
|
||
return FALSE;
|
||
else if (nc == '.' && component_start && no_leading_period)
|
||
return FALSE;
|
||
break;
|
||
case '\\':
|
||
if (DO_ESCAPE)
|
||
c = get_char (&p);
|
||
if (nc != c)
|
||
return FALSE;
|
||
break;
|
||
case '*':
|
||
if (nc == '.' && component_start && no_leading_period)
|
||
return FALSE;
|
||
|
||
{
|
||
const char *last_p;
|
||
|
||
for (last_p = p, c = get_char (&p);
|
||
c == '?' || c == '*';
|
||
last_p = p, c = get_char (&p))
|
||
{
|
||
if (c == '?')
|
||
{
|
||
if (nc == '\0')
|
||
return FALSE;
|
||
else if (nc == G_DIR_SEPARATOR)
|
||
return FALSE;
|
||
else
|
||
{
|
||
last_n = n; nc = get_char (&n);
|
||
}
|
||
}
|
||
}
|
||
|
||
/* If the pattern ends with wildcards, we have a
|
||
* guaranteed match unless there is a dir separator
|
||
* in the remainder of the string.
|
||
*/
|
||
if (c == '\0')
|
||
{
|
||
if (strchr (last_n, G_DIR_SEPARATOR) != NULL)
|
||
return FALSE;
|
||
else
|
||
return TRUE;
|
||
}
|
||
|
||
if (DO_ESCAPE && c == '\\')
|
||
c = get_char (&p);
|
||
|
||
for (p = last_p; nc != '\0';)
|
||
{
|
||
if ((c == '[' || nc == c) &&
|
||
gtk_fnmatch_intern (p, last_n, component_start, no_leading_period))
|
||
return TRUE;
|
||
|
||
component_start = (nc == G_DIR_SEPARATOR);
|
||
last_n = n;
|
||
nc = get_char (&n);
|
||
}
|
||
|
||
return FALSE;
|
||
}
|
||
|
||
case '[':
|
||
{
|
||
/* Nonzero if the sense of the character class is inverted. */
|
||
gboolean not;
|
||
gboolean was_escaped;
|
||
|
||
if (nc == '\0' || nc == G_DIR_SEPARATOR)
|
||
return FALSE;
|
||
|
||
if (nc == '.' && component_start && no_leading_period)
|
||
return FALSE;
|
||
|
||
not = (*p == '!' || *p == '^');
|
||
if (not)
|
||
++p;
|
||
|
||
c = get_unescaped_char (&p, &was_escaped);
|
||
for (;;)
|
||
{
|
||
register gunichar cstart = c, cend = c;
|
||
if (c == '\0')
|
||
/* [ (unterminated) loses. */
|
||
return FALSE;
|
||
|
||
c = get_unescaped_char (&p, &was_escaped);
|
||
|
||
if (!was_escaped && c == '-' && *p != ']')
|
||
{
|
||
cend = get_unescaped_char (&p, &was_escaped);
|
||
if (cend == '\0')
|
||
return FALSE;
|
||
|
||
c = get_char (&p);
|
||
}
|
||
|
||
if (nc >= cstart && nc <= cend)
|
||
goto matched;
|
||
|
||
if (!was_escaped && c == ']')
|
||
break;
|
||
}
|
||
if (!not)
|
||
return FALSE;
|
||
break;
|
||
|
||
matched:;
|
||
/* Skip the rest of the [...] that already matched. */
|
||
/* XXX 1003.2d11 is unclear if was_escaped is right. */
|
||
while (was_escaped || c != ']')
|
||
{
|
||
if (c == '\0')
|
||
/* [... (unterminated) loses. */
|
||
return FALSE;
|
||
|
||
c = get_unescaped_char (&p, &was_escaped);
|
||
}
|
||
if (not)
|
||
return FALSE;
|
||
}
|
||
break;
|
||
|
||
default:
|
||
if (c != nc)
|
||
return FALSE;
|
||
}
|
||
|
||
component_start = (nc == G_DIR_SEPARATOR);
|
||
}
|
||
|
||
if (*n == '\0')
|
||
return TRUE;
|
||
|
||
return FALSE;
|
||
}
|
||
|
||
/* Match STRING against the filename pattern PATTERN, returning zero if
|
||
* it matches, nonzero if not.
|
||
*
|
||
* GTK+ used to use a old version of GNU fnmatch() that was buggy
|
||
* in various ways and didn’t handle UTF-8. The following is
|
||
* converted to UTF-8. To simplify the process of making it
|
||
* correct, this is special-cased to the combinations of flags
|
||
* that gtkfilesel.c uses.
|
||
*
|
||
* FNM_FILE_NAME - always set
|
||
* FNM_LEADING_DIR - never set
|
||
* FNM_NOESCAPE - set only on windows
|
||
* FNM_CASEFOLD - set only on windows
|
||
*/
|
||
gboolean
|
||
_gtk_fnmatch (const char *pattern,
|
||
const char *string,
|
||
gboolean no_leading_period)
|
||
{
|
||
return gtk_fnmatch_intern (pattern, string, TRUE, no_leading_period);
|
||
}
|
||
|
||
/* Built-in self test.  It is compiled out by default; remove the #undef
 * below (or define FNMATCH_TEST_CASES after it) to build this file as a
 * standalone test program.
 */
#undef FNMATCH_TEST_CASES
#ifdef FNMATCH_TEST_CASES

/* Assert that matching STR against PAT with the given NO_LEADING_PERIOD
 * setting yields RESULT.
 */
#define TEST(pat, str, no_leading_period, result) \
  g_assert (_gtk_fnmatch ((pat), (str), (no_leading_period)) == (result))

int main (int argc, char **argv)
{
  TEST ("a", "a", TRUE, TRUE);
  TEST ("a", "b", TRUE, FALSE);

  /* Test what ? matches */
  TEST ("?", "a", TRUE, TRUE);
  TEST ("?", ".", TRUE, FALSE);
  TEST ("a?", "a.", TRUE, TRUE);
  TEST ("a/?", "a/b", TRUE, TRUE);
  TEST ("a/?", "a/.", TRUE, FALSE);
  TEST ("?", "/", TRUE, FALSE);

  /* Test what * matches */
  TEST ("*", "a", TRUE, TRUE);
  TEST ("*", ".", TRUE, FALSE);
  TEST ("a*", "a.", TRUE, TRUE);
  TEST ("a/*", "a/b", TRUE, TRUE);
  TEST ("a/*", "a/.", TRUE, FALSE);
  TEST ("*", "/", TRUE, FALSE);

  /* Range tests */
  TEST ("[ab]", "a", TRUE, TRUE);
  TEST ("[ab]", "c", TRUE, FALSE);
  TEST ("[^ab]", "a", TRUE, FALSE);
  TEST ("[!ab]", "a", TRUE, FALSE);
  TEST ("[^ab]", "c", TRUE, TRUE);
  TEST ("[!ab]", "c", TRUE, TRUE);
  TEST ("[a-c]", "b", TRUE, TRUE);
  TEST ("[a-c]", "d", TRUE, FALSE);
  TEST ("[a-]", "-", TRUE, TRUE);
  TEST ("[]]", "]", TRUE, TRUE);
  TEST ("[^]]", "a", TRUE, TRUE);
  TEST ("[!]]", "a", TRUE, TRUE);

  /* Various unclosed ranges */
  TEST ("[ab", "a", TRUE, FALSE);
  TEST ("[a-", "a", TRUE, FALSE);
  TEST ("[ab", "c", TRUE, FALSE);
  TEST ("[a-", "c", TRUE, FALSE);
  TEST ("[^]", "a", TRUE, FALSE);

  /* Ranges and special no-wildcard matches */
  TEST ("[.]", ".", TRUE, FALSE);
  TEST ("a[.]", "a.", TRUE, TRUE);
  TEST ("a/[.]", "a/.", TRUE, FALSE);
  TEST ("[/]", "/", TRUE, FALSE);
  TEST ("[^/]", "a", TRUE, TRUE);

  /* Basic tests of * (and combinations of * and ?) */
  TEST ("a*b", "ab", TRUE, TRUE);
  TEST ("a*b", "axb", TRUE, TRUE);
  TEST ("a*b", "axxb", TRUE, TRUE);
  TEST ("a**b", "ab", TRUE, TRUE);
  TEST ("a**b", "axb", TRUE, TRUE);
  TEST ("a**b", "axxb", TRUE, TRUE);
  TEST ("a*?*b", "ab", TRUE, FALSE);
  TEST ("a*?*b", "axb", TRUE, TRUE);
  TEST ("a*?*b", "axxb", TRUE, TRUE);

  /* Test of *[range] */
  TEST ("a*[cd]", "ac", TRUE, TRUE);
  TEST ("a*[cd]", "axc", TRUE, TRUE);
  TEST ("a*[cd]", "axx", TRUE, FALSE);

  TEST ("a/[.]", "a/.", TRUE, FALSE);
  TEST ("a*[.]", "a/.", TRUE, FALSE);

  /* Test of UTF-8 */
  TEST ("ä", "ä", TRUE, TRUE);
  TEST ("?", "ä", TRUE, TRUE);
  TEST ("*ö", "äö", TRUE, TRUE);
  TEST ("*ö", "ääö", TRUE, TRUE);
  TEST ("[ä]", "ä", TRUE, TRUE);
  TEST ("[ä-ö]", "é", TRUE, TRUE);
  TEST ("[ä-ö]", "a", TRUE, FALSE);

  /* DO_ESCAPE is always defined (to 0 or 1), so it has to be tested by
   * value: these cases only hold where backslash escaping is enabled.
   */
#if DO_ESCAPE
  /* Tests of escaping */
  TEST ("\\\\", "\\", TRUE, TRUE);
  TEST ("\\?", "?", TRUE, TRUE);
  TEST ("\\?", "a", TRUE, FALSE);
  TEST ("\\*", "*", TRUE, TRUE);
  TEST ("\\*", "a", TRUE, FALSE);
  TEST ("\\[a-b]", "[a-b]", TRUE, TRUE);
  TEST ("[\\\\]", "\\", TRUE, TRUE);
  TEST ("[\\^a]", "a", TRUE, TRUE);
  TEST ("[a\\-c]", "b", TRUE, FALSE);
  TEST ("[a\\-c]", "-", TRUE, TRUE);
  TEST ("[a\\]", "a", TRUE, FALSE);
#endif /* DO_ESCAPE */

  return 0;
}

#endif /* FNMATCH_TEST_CASES */
|