fnmatch.c 8.96 KB
Newer Older
Elliot Lee's avatar
Elliot Lee committed
1
/* Copyright (C) 1991, 1992, 1993 Free Software Foundation, Inc.
2 3
 *
 * This library is free software; you can redistribute it and/or
4
 * modify it under the terms of the GNU Lesser General Public
5 6 7 8 9 10
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
11
 * Lesser General Public License for more details.
12
 *
13
 * You should have received a copy of the GNU Lesser General Public
14 15 16 17
 * License along with this library; if not, write to the
 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
 * Boston, MA 02111-1307, USA.
 */
Elliot Lee's avatar
Elliot Lee committed
18

19
/*
20
 * Modified by the GTK+ Team and others 1997-2000.  See the AUTHORS
21 22 23 24 25
 * file for a list of people on the GTK+ Team.  See the ChangeLog
 * files for a list of changes.  These files are distributed with
 * GTK+ at ftp://ftp.gtk.org/pub/gtk/. 
 */

26 27 28 29 30
/*
 * Stripped down, converted to UTF-8 and test cases added
 *
 *                    Owen Taylor, 13 December 2002;
 */
Elliot Lee's avatar
Elliot Lee committed
31

32
#include "config.h"
33
#include <string.h>
34

35 36 37 38 39
#include <glib.h>

/* Make sure _GNU_SOURCE is defined, so that all constants needed to
 * compile this file are available.
 *
 * NOTE(review): this definition comes after the #include lines above,
 * so it cannot affect headers that were already included -- confirm
 * whether it is still required.
 */
#if !defined (_GNU_SOURCE)
#define _GNU_SOURCE
#endif

44 45 46 47 48
/* Decode the UTF-8 character at *STR, advance *STR to the character
 * that follows it, and return the decoded character.
 *
 * When *STR already points at the terminating NUL, '\0' is returned
 * and *STR is left where it is, so the pointer is never moved beyond
 * the end of the string and repeated calls keep returning '\0'.
 *
 * On G_PLATFORM_WIN32 the character is lower-cased before it is
 * returned, which makes all comparisons built on this helper
 * case-insensitive there.
 */
static gunichar
get_char (const char **str)
{
  gunichar c = g_utf8_get_char (*str);

  /* Stepping over the NUL terminator would leave *str pointing outside
   * the string; any later dereference by the caller would then be an
   * out-of-bounds read.
   */
  if (**str != '\0')
    *str = g_utf8_next_char (*str);

#ifdef G_PLATFORM_WIN32
  c = g_unichar_tolower (c);
#endif

  return c;
}
Elliot Lee's avatar
Elliot Lee committed
56

57 58 59 60 61
/* DO_ESCAPE is 1 when a backslash in a pattern quotes the character
 * that follows it, and 0 on Windows and Cygwin builds, where a
 * backslash is taken literally.
 */
#if !defined(G_OS_WIN32) && !defined(G_WITH_CYGWIN)
#define DO_ESCAPE 1
#else
#define DO_ESCAPE 0
#endif
Elliot Lee's avatar
Elliot Lee committed
62

63 64 65 66 67 68 69 70 71 72 73 74
/* Read the next pattern character from *STR, resolving a backslash
 * escape when DO_ESCAPE is enabled.
 *
 * If the character read is a backslash and escaping is enabled, the
 * character after it is read and returned instead, and *WAS_ESCAPED
 * is set to TRUE.  Otherwise the character is returned unchanged and
 * *WAS_ESCAPED is set to FALSE.  *STR is advanced by get_char() for
 * every character read.
 */
static gunichar
get_unescaped_char (const char **str,
                    gboolean    *was_escaped)
{
  gunichar ch = get_char (str);

  if (DO_ESCAPE && ch == '\\')
    {
      *was_escaped = TRUE;
      return get_char (str);
    }

  *was_escaped = FALSE;
  return ch;
}
Elliot Lee's avatar
Elliot Lee committed
75 76 77 78

/* Match STRING against the filename pattern PATTERN, returning zero if
   it matches, nonzero if not.  */

79 80 81
static gboolean
gtk_fnmatch_intern (const char *pattern,
		    const char *string,
Federico Mena Quintero's avatar
Federico Mena Quintero committed
82 83
		    gboolean    component_start,
		    gboolean    no_leading_period)
84 85 86 87
{
  const char *p = pattern, *n = string;
  
  while (*p)
Elliot Lee's avatar
Elliot Lee committed
88
    {
89 90 91 92 93
      const char *last_n = n;
      
      gunichar c = get_char (&p);
      gunichar nc = get_char (&n);
      
Elliot Lee's avatar
Elliot Lee committed
94 95
      switch (c)
	{
96 97 98 99 100
   	case '?':
	  if (nc == '\0')
	    return FALSE;
	  else if (nc == G_DIR_SEPARATOR)
	    return FALSE;
Federico Mena Quintero's avatar
Federico Mena Quintero committed
101
	  else if (nc == '.' && component_start && no_leading_period)
102
	    return FALSE;
Elliot Lee's avatar
Elliot Lee committed
103 104
	  break;
	case '\\':
105 106 107 108
	  if (DO_ESCAPE)
	    c = get_char (&p);
	  if (nc != c)
	    return FALSE;
Elliot Lee's avatar
Elliot Lee committed
109 110
	  break;
	case '*':
Federico Mena Quintero's avatar
Federico Mena Quintero committed
111
	  if (nc == '.' && component_start && no_leading_period)
112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132
	    return FALSE;

	  {
	    const char *last_p = p;

	    for (last_p = p, c = get_char (&p);
		 c == '?' || c == '*';
		 last_p = p, c = get_char (&p))
	      {
		if (c == '?')
		  {
		    if (nc == '\0')
		      return FALSE;
		    else if (nc == G_DIR_SEPARATOR)
		      return FALSE;
		    else
		      {
			last_n = n; nc = get_char (&n);
		      }
		  }
	      }
Elliot Lee's avatar
Elliot Lee committed
133

134 135 136 137 138 139 140 141 142 143 144
	    /* If the pattern ends with wildcards, we have a
	     * guaranteed match unless there is a dir separator
	     * in the remainder of the string.
	     */
	    if (c == '\0')
	      {
		if (strchr (last_n, G_DIR_SEPARATOR) != NULL)
		  return FALSE;
		else
		  return TRUE;
	      }
Elliot Lee's avatar
Elliot Lee committed
145

146 147
	    if (DO_ESCAPE && c == '\\')
	      c = get_char (&p);
Elliot Lee's avatar
Elliot Lee committed
148

149 150 151
	    for (p = last_p; nc != '\0';)
	      {
		if ((c == '[' || nc == c) &&
Federico Mena Quintero's avatar
Federico Mena Quintero committed
152
		    gtk_fnmatch_intern (p, last_n, component_start, no_leading_period))
153 154 155 156 157 158 159 160
		  return TRUE;
		
		component_start = (nc == G_DIR_SEPARATOR);
		last_n = n;
		nc = get_char (&n);
	      }
		  
	    return FALSE;
Elliot Lee's avatar
Elliot Lee committed
161 162 163 164 165
	  }

	case '[':
	  {
	    /* Nonzero if the sense of the character class is inverted.  */
166 167
	    gboolean not;
	    gboolean was_escaped;
Elliot Lee's avatar
Elliot Lee committed
168

169 170
	    if (nc == '\0' || nc == G_DIR_SEPARATOR)
	      return FALSE;
Elliot Lee's avatar
Elliot Lee committed
171

Federico Mena Quintero's avatar
Federico Mena Quintero committed
172
	    if (nc == '.' && component_start && no_leading_period)
173
	      return FALSE;
Elliot Lee's avatar
Elliot Lee committed
174 175 176 177 178

	    not = (*p == '!' || *p == '^');
	    if (not)
	      ++p;

179
	    c = get_unescaped_char (&p, &was_escaped);
Elliot Lee's avatar
Elliot Lee committed
180 181
	    for (;;)
	      {
182
		register gunichar cstart = c, cend = c;
Elliot Lee's avatar
Elliot Lee committed
183 184
		if (c == '\0')
		  /* [ (unterminated) loses.  */
185
		  return FALSE;
Elliot Lee's avatar
Elliot Lee committed
186

187 188 189
		c = get_unescaped_char (&p, &was_escaped);
		
		if (!was_escaped && c == '-' && *p != ']')
Elliot Lee's avatar
Elliot Lee committed
190
		  {
191
		    cend = get_unescaped_char (&p, &was_escaped);
Elliot Lee's avatar
Elliot Lee committed
192
		    if (cend == '\0')
193
		      return FALSE;
Elliot Lee's avatar
Elliot Lee committed
194

195
		    c = get_char (&p);
Elliot Lee's avatar
Elliot Lee committed
196 197
		  }

198
		if (nc >= cstart && nc <= cend)
Elliot Lee's avatar
Elliot Lee committed
199 200
		  goto matched;

201
		if (!was_escaped && c == ']')
Elliot Lee's avatar
Elliot Lee committed
202 203 204
		  break;
	      }
	    if (!not)
205
	      return FALSE;
Elliot Lee's avatar
Elliot Lee committed
206 207 208 209
	    break;

	  matched:;
	    /* Skip the rest of the [...] that already matched.  */
210 211
	    /* XXX 1003.2d11 is unclear if was_escaped is right.  */
	    while (was_escaped || c != ']')
Elliot Lee's avatar
Elliot Lee committed
212 213 214
	      {
		if (c == '\0')
		  /* [... (unterminated) loses.  */
215
		  return FALSE;
Elliot Lee's avatar
Elliot Lee committed
216

217
		c = get_unescaped_char (&p, &was_escaped);
Elliot Lee's avatar
Elliot Lee committed
218 219
	      }
	    if (not)
220
	      return FALSE;
Elliot Lee's avatar
Elliot Lee committed
221 222 223 224
	  }
	  break;

	default:
225 226
	  if (c != nc)
	    return FALSE;
Elliot Lee's avatar
Elliot Lee committed
227 228
	}

229
      component_start = (nc == G_DIR_SEPARATOR);
Elliot Lee's avatar
Elliot Lee committed
230 231 232
    }

  if (*n == '\0')
233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253
    return TRUE;

  return FALSE;
}

/* Match STRING against the filename pattern PATTERN, returning TRUE
 * if it matches and FALSE if it does not.
 *
 * If NO_LEADING_PERIOD is TRUE, a '.' at the start of a path component
 * is not matched by a wildcard at that position.
 *
 * GTK+ used to use an old version of GNU fnmatch() that was buggy
 * in various ways and didn't handle UTF-8. The following is
 * converted to UTF-8. To simplify the process of making it
 * correct, this is special-cased to the combinations of flags
 * that gtkfilesel.c uses.
 *
 *   FNM_FILE_NAME   - always set
 *   FNM_LEADING_DIR - never set
 *   FNM_NOESCAPE    - set only on windows
 *   FNM_CASEFOLD    - set only on windows
 */
gboolean
_gtk_fnmatch (const char *pattern,
              const char *string,
              gboolean no_leading_period)
{
  /* Matching always begins at the start of a path component. */
  const gboolean at_component_start = TRUE;

  return gtk_fnmatch_intern (pattern, string,
                             at_component_start, no_leading_period);
}

Matthias Clasen's avatar
Matthias Clasen committed
260
/* Built-in self test.  It is compiled out by the #undef below; remove
 * that line (or define FNMATCH_TEST_CASES after it) to build this file
 * as a stand-alone test program.
 */
#undef FNMATCH_TEST_CASES
#ifdef FNMATCH_TEST_CASES

/* Assert that matching STR against PAT with the given
 * NO_LEADING_PERIOD setting yields RESULT.
 */
#define TEST(pat, str, no_leading_period, result) \
  g_assert (_gtk_fnmatch ((pat), (str), (no_leading_period)) == (result))

int main (int argc, char **argv)
{
  TEST ("[a-]", "-", TRUE, TRUE);

  TEST ("a", "a", TRUE, TRUE);
  TEST ("a", "b", TRUE, FALSE);

  /* Test what ? matches */
  TEST ("?", "a", TRUE, TRUE);
  TEST ("?", ".", TRUE, FALSE);
  TEST ("a?", "a.", TRUE, TRUE);
  TEST ("a/?", "a/b", TRUE, TRUE);
  TEST ("a/?", "a/.", TRUE, FALSE);
  TEST ("?", "/", TRUE, FALSE);

  /* Test what * matches */
  TEST ("*", "a", TRUE, TRUE);
  TEST ("*", ".", TRUE, FALSE);
  TEST ("a*", "a.", TRUE, TRUE);
  TEST ("a/*", "a/b", TRUE, TRUE);
  TEST ("a/*", "a/.", TRUE, FALSE);
  TEST ("*", "/", TRUE, FALSE);

  /* Range tests */
  TEST ("[ab]", "a", TRUE, TRUE);
  TEST ("[ab]", "c", TRUE, FALSE);
  TEST ("[^ab]", "a", TRUE, FALSE);
  TEST ("[!ab]", "a", TRUE, FALSE);
  TEST ("[^ab]", "c", TRUE, TRUE);
  TEST ("[!ab]", "c", TRUE, TRUE);
  TEST ("[a-c]", "b", TRUE, TRUE);
  TEST ("[a-c]", "d", TRUE, FALSE);
  TEST ("[a-]", "-", TRUE, TRUE);
  TEST ("[]]", "]", TRUE, TRUE);
  TEST ("[^]]", "a", TRUE, TRUE);
  TEST ("[!]]", "a", TRUE, TRUE);

  /* Various unclosed ranges */
  TEST ("[ab", "a", TRUE, FALSE);
  TEST ("[a-", "a", TRUE, FALSE);
  TEST ("[ab", "c", TRUE, FALSE);
  TEST ("[a-", "c", TRUE, FALSE);
  TEST ("[^]", "a", TRUE, FALSE);

  /* Ranges and special no-wildcard matches */
  TEST ("[.]", ".", TRUE, FALSE);
  TEST ("a[.]", "a.", TRUE, TRUE);
  TEST ("a/[.]", "a/.", TRUE, FALSE);
  TEST ("[/]", "/", TRUE, FALSE);
  TEST ("[^/]", "a", TRUE, TRUE);

  /* Basic tests of * (and combinations of * and ?) */
  TEST ("a*b", "ab", TRUE, TRUE);
  TEST ("a*b", "axb", TRUE, TRUE);
  TEST ("a*b", "axxb", TRUE, TRUE);
  TEST ("a**b", "ab", TRUE, TRUE);
  TEST ("a**b", "axb", TRUE, TRUE);
  TEST ("a**b", "axxb", TRUE, TRUE);
  TEST ("a*?*b", "ab", TRUE, FALSE);
  TEST ("a*?*b", "axb", TRUE, TRUE);
  TEST ("a*?*b", "axxb", TRUE, TRUE);

  /* Test of  *[range] */
  TEST ("a*[cd]", "ac", TRUE, TRUE);
  TEST ("a*[cd]", "axc", TRUE, TRUE);
  TEST ("a*[cd]", "axx", TRUE, FALSE);

  TEST ("a/[.]", "a/.", TRUE, FALSE);
  TEST ("a*[.]", "a/.", TRUE, FALSE);

  /* Test of UTF-8 */
  TEST ("ä", "ä", TRUE, TRUE);
  TEST ("?", "ä", TRUE, TRUE);
  TEST ("*ö", "äö", TRUE, TRUE);
  TEST ("*ö", "ääö", TRUE, TRUE);
  TEST ("[ä]", "ä", TRUE, TRUE);
  TEST ("[ä-ö]", "é", TRUE, TRUE);
  TEST ("[ä-ö]", "a", TRUE, FALSE);

  /* DO_ESCAPE is always defined (as 0 or 1), so its value has to be
   * tested here, not merely whether it is defined.
   */
#if DO_ESCAPE
  /* Tests of escaping */
  TEST ("\\\\", "\\", TRUE, TRUE);
  TEST ("\\?", "?", TRUE, TRUE);
  TEST ("\\?", "a", TRUE, FALSE);
  TEST ("\\*", "*", TRUE, TRUE);
  TEST ("\\*", "a", TRUE, FALSE);
  TEST ("\\[a-b]", "[a-b]", TRUE, TRUE);
  TEST ("[\\\\]", "\\", TRUE, TRUE);
  TEST ("[\\^a]", "a", TRUE, TRUE);
  TEST ("[a\\-c]", "b", TRUE, FALSE);
  TEST ("[a\\-c]", "-", TRUE, TRUE);
  TEST ("[a\\]", "a", TRUE, FALSE);
#endif /* DO_ESCAPE */

  return 0;
}

#endif /* FNMATCH_TEST_CASES */