1
0
mirror of https://github.com/samba-team/samba.git synced 2024-12-24 21:34:56 +03:00

r2778: merged the new samba4 ms_fnmatch code to Samba3. Thanks to Rusty

Russel for some help in designing the new algorithm.
(This used to be commit 38144f8d2c)
This commit is contained in:
Andrew Tridgell 2004-10-02 09:14:43 +00:00 committed by Gerald (Jerry) Carter
parent 96876f696e
commit 640f124ca2

View File

@ -1,7 +1,7 @@
/*
Unix SMB/CIFS implementation.
filename matching routine
Copyright (C) Andrew Tridgell 1992-1998
Copyright (C) Andrew Tridgell 1992-2004
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
@ -15,238 +15,193 @@
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
*/
/*
This module was originally based on fnmatch.c copyright by the Free
Software Foundation. It bears little resemblence to that code now
Software Foundation. It bears little (if any) resemblence to that
code now
*/
#if FNMATCH_TEST
#include <stdio.h>
#include <stdlib.h>
#else
#include "includes.h"
#endif
/*
bugger. we need a separate wildcard routine for older versions
of the protocol. This is not yet perfect, but its a lot
better than what we had */
static int ms_fnmatch_lanman_core(const smb_ucs2_t *pattern,
const smb_ucs2_t *string,
BOOL case_sensitive)
static int null_match(const smb_ucs2_t *p)
{
const smb_ucs2_t *p = pattern, *n = string;
smb_ucs2_t c;
if (strcmp_wa(p, "?")==0 && strcmp_wa(n, ".")) goto match;
while ((c = *p++)) {
switch (c) {
case UCS2_CHAR('.'):
if (! *n) goto next;
if (*n != UCS2_CHAR('.')) goto nomatch;
n++;
break;
case UCS2_CHAR('?'):
if (! *n) goto next;
if ((*n == UCS2_CHAR('.') &&
n[1] != UCS2_CHAR('.')) || ! *n)
goto next;
n++;
break;
case UCS2_CHAR('>'):
if (! *n) goto next;
if (n[0] == UCS2_CHAR('.')) {
if (! n[1] && ms_fnmatch_lanman_core(p, n+1, case_sensitive) == 0) goto match;
if (ms_fnmatch_lanman_core(p, n, case_sensitive) == 0) goto match;
goto nomatch;
}
n++;
break;
case UCS2_CHAR('*'):
if (! *n) goto next;
if (! *p) goto match;
for (; *n; n++) {
if (ms_fnmatch_lanman_core(p, n, case_sensitive) == 0) goto match;
}
break;
case UCS2_CHAR('<'):
for (; *n; n++) {
if (ms_fnmatch_lanman_core(p, n, case_sensitive) == 0) goto match;
if (*n == UCS2_CHAR('.') &&
!strchr_w(n+1,UCS2_CHAR('.'))) {
n++;
break;
}
}
break;
case UCS2_CHAR('"'):
if (*n == 0 && ms_fnmatch_lanman_core(p, n, case_sensitive) == 0) goto match;
if (*n != UCS2_CHAR('.')) goto nomatch;
n++;
break;
default:
if (case_sensitive) {
if (c != *n) goto nomatch;
} else {
if (tolower_w(c) != tolower_w(*n)) goto nomatch;
}
n++;
}
for (;*p;p++) {
if (*p != UCS2_CHAR('*') &&
*p != UCS2_CHAR('<') &&
*p != UCS2_CHAR('"') &&
*p != UCS2_CHAR('>')) return -1;
}
if (! *n) goto match;
nomatch:
/*
if (verbose) printf("NOMATCH pattern=[%s] string=[%s]\n", pattern, string);
*/
return -1;
next:
if (ms_fnmatch_lanman_core(p, n, case_sensitive) == 0) goto match;
goto nomatch;
match:
/*
if (verbose) printf("MATCH pattern=[%s] string=[%s]\n", pattern, string);
*/
return 0;
}
static int ms_fnmatch_lanman1(const smb_ucs2_t *pattern,
const smb_ucs2_t *string, BOOL case_sensitive)
{
if (!strpbrk_wa(pattern, "?*<>\"")) {
smb_ucs2_t s[] = {UCS2_CHAR('.'), 0};
if (strcmp_wa(string,"..") == 0) string = s;
return strcasecmp_w(pattern, string);
}
if (strcmp_wa(string,"..") == 0 || strcmp_wa(string,".") == 0) {
smb_ucs2_t dot[] = {UCS2_CHAR('.'), 0};
smb_ucs2_t dotdot[] = {UCS2_CHAR('.'), UCS2_CHAR('.'), 0};
return ms_fnmatch_lanman_core(pattern, dotdot, case_sensitive) &&
ms_fnmatch_lanman_core(pattern, dot, case_sensitive);
}
return ms_fnmatch_lanman_core(pattern, string, case_sensitive);
}
/* the following function was derived using the masktest utility -
after years of effort we finally have a perfect MS wildcard
matching routine!
NOTE: this matches only filenames with no directory component
Returns 0 on match, -1 on fail.
/*
the max_n structure is purely for efficiency, it doesn't contribute
to the matching algorithm except by ensuring that the algorithm does
not grow exponentially
*/
static int ms_fnmatch_w(const smb_ucs2_t *pattern, const smb_ucs2_t *string,
int protocol, BOOL case_sensitive)
{
const smb_ucs2_t *p = pattern, *n = string;
smb_ucs2_t c;
struct max_n {
const smb_ucs2_t *predot;
const smb_ucs2_t *postdot;
};
if (protocol <= PROTOCOL_LANMAN2) {
return ms_fnmatch_lanman1(pattern, string, case_sensitive);
}
/*
p and n are the pattern and string being matched. The max_n array is
an optimisation only. The ldot pointer is NULL if the string does
not contain a '.', otherwise it points at the last dot in 'n'.
*/
static int ms_fnmatch_core(const smb_ucs2_t *p, const smb_ucs2_t *n,
struct max_n *max_n, const smb_ucs2_t *ldot)
{
smb_ucs2_t c;
int i;
while ((c = *p++)) {
switch (c) {
case UCS2_CHAR('?'):
if (! *n) return -1;
n++;
break;
case UCS2_CHAR('>'):
if (n[0] == UCS2_CHAR('.')) {
if (! n[1] && ms_fnmatch_w(p, n+1, protocol, case_sensitive) == 0) return 0;
if (ms_fnmatch_w(p, n, protocol, case_sensitive) == 0) return 0;
return -1;
}
if (! *n) return ms_fnmatch_w(p, n, protocol, case_sensitive);
n++;
break;
/* a '*' matches zero or more characters of any type */
case UCS2_CHAR('*'):
while (*p == UCS2_CHAR('*')) {
p++;
if (max_n->predot && max_n->predot <= n) {
return null_match(p);
}
for (; *n; n++) {
if (ms_fnmatch_w(p, n, protocol, case_sensitive) == 0) return 0;
}
break;
case UCS2_CHAR('<'):
for (; *n; n++) {
if (ms_fnmatch_w(p, n, protocol, case_sensitive) == 0) return 0;
if (*n == UCS2_CHAR('.') && !strchr_wa(n+1,'.')) {
n++;
break;
for (i=0; n[i]; i++) {
if (ms_fnmatch_core(p, n+i, max_n+1, ldot) == 0) {
return 0;
}
}
if (!max_n->predot || max_n->predot > n) max_n->predot = n;
return null_match(p);
/* a '<' matches zero or more characters of
any type, but stops matching at the last
'.' in the string. */
case UCS2_CHAR('<'):
if (max_n->predot && max_n->predot <= n) {
return null_match(p);
}
if (max_n->postdot && max_n->postdot <= n && n <= ldot) {
return -1;
}
for (i=0; n[i]; i++) {
if (ms_fnmatch_core(p, n+i, max_n+1, ldot) == 0) return 0;
if (n+i == ldot) {
if (ms_fnmatch_core(p, n+i+1, max_n+1, ldot) == 0) return 0;
if (!max_n->postdot || max_n->postdot > n) max_n->postdot = n;
return -1;
}
}
if (!max_n->predot || max_n->predot > n) max_n->predot = n;
return null_match(p);
/* a '?' matches any single character */
case UCS2_CHAR('?'):
if (! *n) {
return -1;
}
n++;
break;
/* a '?' matches any single character */
case UCS2_CHAR('>'):
if (n[0] == UCS2_CHAR('.')) {
if (! n[1] && null_match(p) == 0) {
return 0;
}
break;
}
if (! *n) return null_match(p);
n++;
break;
case UCS2_CHAR('"'):
if (*n == 0 && ms_fnmatch_w(p, n, protocol, case_sensitive) == 0) return 0;
if (*n == 0 && null_match(p) == 0) {
return 0;
}
if (*n != UCS2_CHAR('.')) return -1;
n++;
break;
default:
if (case_sensitive) {
if (c != *n) return -1;
} else {
if (tolower_w(c) != tolower_w(*n)) return -1;
if (c != *n && toupper_w(c) != toupper_w(*n)) {
return -1;
}
n++;
break;
}
}
if (! *n) return 0;
if (! *n) {
return 0;
}
return -1;
}
int ms_fnmatch(const char *pattern, const char *string, int protocol,
BOOL case_senstive)
int ms_fnmatch(const char *pattern, const char *string, enum protocol_types protocol)
{
wpstring buffer_pattern, buffer_string;
int ret;
size_t size;
wpstring p, s;
int ret, count, i;
struct max_n *max_n = NULL;
size = push_ucs2(NULL, buffer_pattern, pattern, sizeof(buffer_pattern), STR_TERMINATE);
if (size == (size_t)-1) {
return -1;
/* Not quite the right answer, but finding the right one
under this failure case is expensive, and it's pretty close */
}
size = push_ucs2(NULL, buffer_string, string, sizeof(buffer_string), STR_TERMINATE);
if (size == (size_t)-1) {
return -1;
/* Not quite the right answer, but finding the right one
under this failure case is expensive, and it's pretty close */
if (strcmp(string, "..") == 0) {
string = ".";
}
ret = ms_fnmatch_w(buffer_pattern, buffer_string, protocol, case_senstive);
DEBUG(10,("ms_fnmatch(%s,%s) -> %d\n", pattern, string, ret));
if (strpbrk(pattern, "<>*?\"") == NULL) {
/* this is not just an optmisation - it is essential
for LANMAN1 correctness */
return StrCaseCmp(pattern, string);
}
pstrcpy_wa(p, pattern);
pstrcpy_wa(s, string);
if (protocol <= PROTOCOL_LANMAN2) {
/*
for older negotiated protocols it is possible to
translate the pattern to produce a "new style"
pattern that exactly matches w2k behaviour
*/
for (i=0;p[i];i++) {
if (p[i] == UCS2_CHAR('?')) {
p[i] = UCS2_CHAR('>');
} else if (p[i] == UCS2_CHAR('.') &&
(p[i+1] == UCS2_CHAR('?') ||
p[i+1] == UCS2_CHAR('*') ||
p[i+1] == 0)) {
p[i] = UCS2_CHAR('"');
} else if (p[i] == UCS2_CHAR('*') && p[i+1] == UCS2_CHAR('.')) {
p[i] = UCS2_CHAR('<');
}
}
}
for (count=i=0;p[i];i++) {
if (p[i] == UCS2_CHAR('*') || p[i] == UCS2_CHAR('<')) count++;
}
if (count != 0) {
max_n = calloc(sizeof(struct max_n), count);
if (!max_n) {
return -1;
}
}
ret = ms_fnmatch_core(p, s, max_n, strrchr_w(s, UCS2_CHAR('.')));
if (max_n) {
free(max_n);
}
return ret;
}
/* a generic fnmatch function - uses for non-CIFS pattern matching */
int gen_fnmatch(const char *pattern, const char *string)
{
return ms_fnmatch(pattern, string, PROTOCOL_NT1, True);
return ms_fnmatch(pattern, string, PROTOCOL_NT1);
}