1997-11-24 22:37:52 +00:00
|
|
|
|
/* Copyright (C) 1991, 1992, 1993 Free Software Foundation, Inc.
|
1998-04-13 02:02:47 +00:00
|
|
|
|
*
|
|
|
|
|
* This library is free software; you can redistribute it and/or
|
2000-07-26 11:33:08 +00:00
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
1998-04-13 02:02:47 +00:00
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
|
* version 2 of the License, or (at your option) any later version.
|
|
|
|
|
*
|
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
2000-07-26 11:33:08 +00:00
|
|
|
|
* Lesser General Public License for more details.
|
1998-04-13 02:02:47 +00:00
|
|
|
|
*
|
2000-07-26 11:33:08 +00:00
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
2012-02-27 13:01:10 +00:00
|
|
|
|
* License along with this library. If not, see <http://www.gnu.org/licenses/>.
|
1998-04-13 02:02:47 +00:00
|
|
|
|
*/
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
1999-02-24 07:37:18 +00:00
|
|
|
|
/*
|
2000-07-26 11:33:08 +00:00
|
|
|
|
* Modified by the GTK+ Team and others 1997-2000. See the AUTHORS
|
1999-02-24 07:37:18 +00:00
|
|
|
|
* file for a list of people on the GTK+ Team. See the ChangeLog
|
|
|
|
|
* files for a list of changes. These files are distributed with
|
|
|
|
|
* GTK+ at ftp://ftp.gtk.org/pub/gtk/.
|
|
|
|
|
*/
|
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
/*
|
|
|
|
|
* Stripped down, converted to UTF-8 and test cases added
|
|
|
|
|
*
|
|
|
|
|
* Owen Taylor, 13 December 2002;
|
|
|
|
|
*/
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2008-06-22 14:28:52 +00:00
|
|
|
|
#include "config.h"
|
2012-10-02 17:27:25 +00:00
|
|
|
|
|
|
|
|
|
#include "gtkprivate.h"
|
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
#include <string.h>
|
1997-12-05 04:29:22 +00:00
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
#include <glib.h>
|
|
|
|
|
|
|
|
|
|
static gunichar
|
2021-06-04 03:55:30 +00:00
|
|
|
|
get_char (const char **str,
|
|
|
|
|
gboolean casefold)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
{
|
|
|
|
|
gunichar c = g_utf8_get_char (*str);
|
|
|
|
|
*str = g_utf8_next_char (*str);
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2021-06-04 03:55:30 +00:00
|
|
|
|
if (casefold)
|
|
|
|
|
c = g_unichar_tolower (c);
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return c;
|
|
|
|
|
}
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
/* DO_ESCAPE is 1 when a backslash in the pattern escapes the character
 * that follows it, and 0 when a backslash is an ordinary character.
 * Escaping is turned off for Windows and Cygwin builds (the equivalent
 * of fnmatch()'s FNM_NOESCAPE flag).
 */
#if !defined(G_OS_WIN32) && !defined(G_WITH_CYGWIN)
#define DO_ESCAPE 1
#else
#define DO_ESCAPE 0
#endif
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
static gunichar
|
|
|
|
|
get_unescaped_char (const char **str,
|
2021-06-04 03:55:30 +00:00
|
|
|
|
gboolean *was_escaped,
|
|
|
|
|
gboolean casefold)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
{
|
2021-06-04 03:55:30 +00:00
|
|
|
|
gunichar c = get_char (str, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
|
|
|
|
|
*was_escaped = DO_ESCAPE && c == '\\';
|
|
|
|
|
if (*was_escaped)
|
2021-06-04 03:55:30 +00:00
|
|
|
|
c = get_char (str, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
|
|
|
|
/* Match STRING against the filename pattern PATTERN, returning zero if
|
|
|
|
|
it matches, nonzero if not. */
|
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
static gboolean
|
|
|
|
|
gtk_fnmatch_intern (const char *pattern,
|
|
|
|
|
const char *string,
|
2004-06-02 17:46:21 +00:00
|
|
|
|
gboolean component_start,
|
2021-06-04 03:55:30 +00:00
|
|
|
|
gboolean no_leading_period,
|
|
|
|
|
gboolean casefold)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
{
|
|
|
|
|
const char *p = pattern, *n = string;
|
|
|
|
|
|
|
|
|
|
while (*p)
|
1997-11-24 22:37:52 +00:00
|
|
|
|
{
|
2002-12-13 23:18:03 +00:00
|
|
|
|
const char *last_n = n;
|
|
|
|
|
|
2021-06-04 03:55:30 +00:00
|
|
|
|
gunichar c = get_char (&p, casefold);
|
|
|
|
|
gunichar nc = get_char (&n, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
|
1997-11-24 22:37:52 +00:00
|
|
|
|
switch (c)
|
|
|
|
|
{
|
2002-12-13 23:18:03 +00:00
|
|
|
|
case '?':
|
|
|
|
|
if (nc == '\0')
|
|
|
|
|
return FALSE;
|
|
|
|
|
else if (nc == G_DIR_SEPARATOR)
|
|
|
|
|
return FALSE;
|
2004-06-02 17:46:21 +00:00
|
|
|
|
else if (nc == '.' && component_start && no_leading_period)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
break;
|
|
|
|
|
case '\\':
|
2002-12-13 23:18:03 +00:00
|
|
|
|
if (DO_ESCAPE)
|
2021-06-04 03:55:30 +00:00
|
|
|
|
c = get_char (&p, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
if (nc != c)
|
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
break;
|
|
|
|
|
case '*':
|
2004-06-02 17:46:21 +00:00
|
|
|
|
if (nc == '.' && component_start && no_leading_period)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return FALSE;
|
|
|
|
|
|
|
|
|
|
{
|
2021-05-03 11:33:49 +00:00
|
|
|
|
const char *last_p;
|
2002-12-13 23:18:03 +00:00
|
|
|
|
|
2021-06-04 03:55:30 +00:00
|
|
|
|
for (last_p = p, c = get_char (&p, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
c == '?' || c == '*';
|
2021-06-04 03:55:30 +00:00
|
|
|
|
last_p = p, c = get_char (&p, casefold))
|
2002-12-13 23:18:03 +00:00
|
|
|
|
{
|
|
|
|
|
if (c == '?')
|
|
|
|
|
{
|
|
|
|
|
if (nc == '\0')
|
|
|
|
|
return FALSE;
|
|
|
|
|
else if (nc == G_DIR_SEPARATOR)
|
|
|
|
|
return FALSE;
|
|
|
|
|
else
|
|
|
|
|
{
|
2021-06-04 03:55:30 +00:00
|
|
|
|
last_n = n; nc = get_char (&n, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
/* If the pattern ends with wildcards, we have a
|
|
|
|
|
* guaranteed match unless there is a dir separator
|
|
|
|
|
* in the remainder of the string.
|
|
|
|
|
*/
|
|
|
|
|
if (c == '\0')
|
|
|
|
|
{
|
|
|
|
|
if (strchr (last_n, G_DIR_SEPARATOR) != NULL)
|
|
|
|
|
return FALSE;
|
|
|
|
|
else
|
|
|
|
|
return TRUE;
|
|
|
|
|
}
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
if (DO_ESCAPE && c == '\\')
|
2021-06-04 03:55:30 +00:00
|
|
|
|
c = get_char (&p, casefold);
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
for (p = last_p; nc != '\0';)
|
|
|
|
|
{
|
|
|
|
|
if ((c == '[' || nc == c) &&
|
2021-06-04 03:55:30 +00:00
|
|
|
|
gtk_fnmatch_intern (p, last_n, component_start, no_leading_period, casefold))
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return TRUE;
|
|
|
|
|
|
|
|
|
|
component_start = (nc == G_DIR_SEPARATOR);
|
|
|
|
|
last_n = n;
|
2021-06-04 03:55:30 +00:00
|
|
|
|
nc = get_char (&n, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
case '[':
|
|
|
|
|
{
|
|
|
|
|
/* Nonzero if the sense of the character class is inverted. */
|
2002-12-13 23:18:03 +00:00
|
|
|
|
gboolean not;
|
|
|
|
|
gboolean was_escaped;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
if (nc == '\0' || nc == G_DIR_SEPARATOR)
|
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2004-06-02 17:46:21 +00:00
|
|
|
|
if (nc == '.' && component_start && no_leading_period)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
|
|
|
|
not = (*p == '!' || *p == '^');
|
|
|
|
|
if (not)
|
|
|
|
|
++p;
|
|
|
|
|
|
2021-06-04 03:55:30 +00:00
|
|
|
|
c = get_unescaped_char (&p, &was_escaped, casefold);
|
1997-11-24 22:37:52 +00:00
|
|
|
|
for (;;)
|
|
|
|
|
{
|
2002-12-13 23:18:03 +00:00
|
|
|
|
register gunichar cstart = c, cend = c;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
if (c == '\0')
|
|
|
|
|
/* [ (unterminated) loses. */
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2021-06-04 03:55:30 +00:00
|
|
|
|
c = get_unescaped_char (&p, &was_escaped, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
|
|
|
|
|
if (!was_escaped && c == '-' && *p != ']')
|
1997-11-24 22:37:52 +00:00
|
|
|
|
{
|
2021-06-04 03:55:30 +00:00
|
|
|
|
cend = get_unescaped_char (&p, &was_escaped, casefold);
|
1997-11-24 22:37:52 +00:00
|
|
|
|
if (cend == '\0')
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2021-06-04 03:55:30 +00:00
|
|
|
|
c = get_char (&p, casefold);
|
1997-11-24 22:37:52 +00:00
|
|
|
|
}
|
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
if (nc >= cstart && nc <= cend)
|
1997-11-24 22:37:52 +00:00
|
|
|
|
goto matched;
|
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
if (!was_escaped && c == ']')
|
1997-11-24 22:37:52 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
if (!not)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
matched:;
|
|
|
|
|
/* Skip the rest of the [...] that already matched. */
|
2002-12-13 23:18:03 +00:00
|
|
|
|
/* XXX 1003.2d11 is unclear if was_escaped is right. */
|
|
|
|
|
while (was_escaped || c != ']')
|
1997-11-24 22:37:52 +00:00
|
|
|
|
{
|
|
|
|
|
if (c == '\0')
|
|
|
|
|
/* [... (unterminated) loses. */
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
|
2021-06-04 03:55:30 +00:00
|
|
|
|
c = get_unescaped_char (&p, &was_escaped, casefold);
|
1997-11-24 22:37:52 +00:00
|
|
|
|
}
|
|
|
|
|
if (not)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
2002-12-13 23:18:03 +00:00
|
|
|
|
if (c != nc)
|
|
|
|
|
return FALSE;
|
1997-11-24 22:37:52 +00:00
|
|
|
|
}
|
|
|
|
|
|
2002-12-13 23:18:03 +00:00
|
|
|
|
component_start = (nc == G_DIR_SEPARATOR);
|
1997-11-24 22:37:52 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (*n == '\0')
|
2002-12-13 23:18:03 +00:00
|
|
|
|
return TRUE;
|
|
|
|
|
|
|
|
|
|
return FALSE;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Match STRING against the filename pattern PATTERN, returning zero if
|
|
|
|
|
* it matches, nonzero if not.
|
|
|
|
|
*
|
|
|
|
|
* GTK+ used to use a old version of GNU fnmatch() that was buggy
|
2014-02-07 18:32:47 +00:00
|
|
|
|
* in various ways and didn’t handle UTF-8. The following is
|
2002-12-13 23:18:03 +00:00
|
|
|
|
* converted to UTF-8. To simplify the process of making it
|
|
|
|
|
* correct, this is special-cased to the combinations of flags
|
|
|
|
|
* that gtkfilesel.c uses.
|
|
|
|
|
*
|
|
|
|
|
* FNM_FILE_NAME - always set
|
|
|
|
|
* FNM_LEADING_DIR - never set
|
|
|
|
|
* FNM_NOESCAPE - set only on windows
|
|
|
|
|
* FNM_CASEFOLD - set only on windows
|
|
|
|
|
*/
|
|
|
|
|
gboolean
|
|
|
|
|
_gtk_fnmatch (const char *pattern,
|
2004-06-02 17:46:21 +00:00
|
|
|
|
const char *string,
|
2021-06-04 03:55:30 +00:00
|
|
|
|
gboolean no_leading_period,
|
|
|
|
|
gboolean casefold)
|
2002-12-13 23:18:03 +00:00
|
|
|
|
{
|
2021-06-04 03:55:30 +00:00
|
|
|
|
return gtk_fnmatch_intern (pattern, string, TRUE, no_leading_period, casefold);
|
2002-12-13 23:18:03 +00:00
|
|
|
|
}
|