2014-08-06 16:09:23 -07:00
# include <linux/module.h>
# include <linux/glob.h>
/*
* The only reason this code can be compiled as a module is because the
* ATA code that depends on it can be as well . In practice , they ' re
* both usually compiled in and the module overhead goes away .
*/
MODULE_DESCRIPTION ( " glob(7) matching " ) ;
MODULE_LICENSE ( " Dual MIT/GPL " ) ;
/**
* glob_match - Shell - style pattern matching , like ! fnmatch ( pat , str , 0 )
* @ pat : Shell - style pattern to match , e . g . " *.[ch] " .
* @ str : String to match . The pattern must match the entire string .
*
* Perform shell - style glob matching , returning true ( 1 ) if the match
* succeeds , or false ( 0 ) if it fails . Equivalent to ! fnmatch ( @ pat , @ str , 0 ) .
*
* Pattern metacharacters are ? , * , [ and \ .
* ( And , inside character classes , ! , - and ] . )
*
* This is small and simple implementation intended for device blacklists
* where a string is matched against a number of patterns . Thus , it
* does not preprocess the patterns . It is non - recursive , and run - time
* is at most quadratic : strlen ( @ str ) * strlen ( @ pat ) .
*
* An example of the worst case is glob_match ( " *aaaaa " , " aaaaaaaaaa " ) ;
* it takes 6 passes over the pattern before matching the string .
*
* Like ! fnmatch ( @ pat , @ str , 0 ) and unlike the shell , this does NOT
* treat / or leading . specially ; it isn ' t actually used for pathnames .
*
* Note that according to glob ( 7 ) ( and unlike bash ) , character classes
* are complemented by a leading ! ; this does not support the regex - style
* [ ^ a - z ] syntax .
*
* An opening bracket without a matching close is matched literally .
*/
bool __pure glob_match ( char const * pat , char const * str )
{
/*
* Backtrack to previous * on mismatch and retry starting one
* character later in the string . Because * matches all characters
* ( no exception for / ) , it can be easily proved that there ' s
* never a need to backtrack multiple levels .
*/
char const * back_pat = NULL , * back_str = back_str ;
/*
* Loop over each token ( character or class ) in pat , matching
* it against the remaining unmatched tail of str . Return false
* on mismatch , or true after matching the trailing nul bytes .
*/
for ( ; ; ) {
unsigned char c = * str + + ;
unsigned char d = * pat + + ;
switch ( d ) {
case ' ? ' : /* Wildcard: anything but nul */
if ( c = = ' \0 ' )
return false ;
break ;
case ' * ' : /* Any-length wildcard */
if ( * pat = = ' \0 ' ) /* Optimize trailing * case */
return true ;
back_pat = pat ;
back_str = - - str ; /* Allow zero-length match */
break ;
case ' [ ' : { /* Character class */
bool match = false , inverted = ( * pat = = ' ! ' ) ;
char const * class = pat + inverted ;
unsigned char a = * class + + ;
/*
* Iterate over each span in the character class .
* A span is either a single character a , or a
* range a - b . The first span may begin with ' ] ' .
*/
do {
unsigned char b = a ;
if ( a = = ' \0 ' ) /* Malformed */
goto literal ;
if ( class [ 0 ] = = ' - ' & & class [ 1 ] ! = ' ] ' ) {
b = class [ 1 ] ;
if ( b = = ' \0 ' )
goto literal ;
class + = 2 ;
/* Any special action if a > b? */
}
match | = ( a < = c & & c < = b ) ;
} while ( ( a = * class + + ) ! = ' ] ' ) ;
if ( match = = inverted )
goto backtrack ;
pat = class ;
}
break ;
case ' \\ ' :
d = * pat + + ;
/*FALLTHROUGH*/
default : /* Literal character */
literal :
if ( c = = d ) {
if ( d = = ' \0 ' )
return true ;
break ;
}
backtrack :
if ( c = = ' \0 ' | | ! back_pat )
return false ; /* No point continuing */
/* Try again from last *, one character later in str. */
pat = back_pat ;
str = + + back_str ;
break ;
}
}
}
EXPORT_SYMBOL ( glob_match ) ;
2014-08-06 16:09:25 -07:00
# ifdef CONFIG_GLOB_SELFTEST
# include <linux/printk.h>
# include <linux/moduleparam.h>
/* Boot with "glob.verbose=1" to show successful tests, too */
static bool verbose = false ;
module_param ( verbose , bool , 0 ) ;
struct glob_test {
char const * pat , * str ;
bool expected ;
} ;
static bool __pure __init test ( char const * pat , char const * str , bool expected )
{
bool match = glob_match ( pat , str ) ;
bool success = match = = expected ;
/* Can't get string literals into a particular section, so... */
static char const msg_error [ ] __initconst =
KERN_ERR " glob: \" %s \" vs. \" %s \" : %s *** ERROR *** \n " ;
static char const msg_ok [ ] __initconst =
KERN_DEBUG " glob: \" %s \" vs. \" %s \" : %s OK \n " ;
static char const mismatch [ ] __initconst = " mismatch " ;
char const * message ;
if ( ! success )
message = msg_error ;
else if ( verbose )
message = msg_ok ;
else
return success ;
printk ( message , pat , str , mismatch + 3 * match ) ;
return success ;
}
/*
* The tests are all jammed together in one array to make it simpler
* to place that array in the . init . rodata section . The obvious
* " array of structures containing char * " has no way to force the
* pointed - to strings to be in a particular section .
*
* Anyway , a test consists of :
* 1. Expected glob_match result : ' 1 ' or ' 0 ' .
* 2. Pattern to match : null - terminated string
* 3. String to match against : null - terminated string
*
* The list of tests is terminated with a final ' \0 ' instead of
* a glob_match result character .
*/
static char const glob_tests [ ] __initconst =
/* Some basic tests */
" 1 " " a \0 " " a \0 "
" 0 " " a \0 " " b \0 "
" 0 " " a \0 " " aa \0 "
" 0 " " a \0 " " \0 "
" 1 " " \0 " " \0 "
" 0 " " \0 " " a \0 "
/* Simple character class tests */
" 1 " " [a] \0 " " a \0 "
" 0 " " [a] \0 " " b \0 "
" 0 " " [!a] \0 " " a \0 "
" 1 " " [!a] \0 " " b \0 "
" 1 " " [ab] \0 " " a \0 "
" 1 " " [ab] \0 " " b \0 "
" 0 " " [ab] \0 " " c \0 "
" 1 " " [!ab] \0 " " c \0 "
" 1 " " [a-c] \0 " " b \0 "
" 0 " " [a-c] \0 " " d \0 "
/* Corner cases in character class parsing */
" 1 " " [a-c-e-g] \0 " " - \0 "
" 0 " " [a-c-e-g] \0 " " d \0 "
" 1 " " [a-c-e-g] \0 " " f \0 "
" 1 " " []a-ceg-ik[] \0 " " a \0 "
" 1 " " []a-ceg-ik[] \0 " " ] \0 "
" 1 " " []a-ceg-ik[] \0 " " [ \0 "
" 1 " " []a-ceg-ik[] \0 " " h \0 "
" 0 " " []a-ceg-ik[] \0 " " f \0 "
" 0 " " [!]a-ceg-ik[] \0 " " h \0 "
" 0 " " [!]a-ceg-ik[] \0 " " ] \0 "
" 1 " " [!]a-ceg-ik[] \0 " " f \0 "
/* Simple wild cards */
" 1 " " ? \0 " " a \0 "
" 0 " " ? \0 " " aa \0 "
" 0 " " ?? \0 " " a \0 "
" 1 " " ?x? \0 " " axb \0 "
" 0 " " ?x? \0 " " abx \0 "
" 0 " " ?x? \0 " " xab \0 "
/* Asterisk wild cards (backtracking) */
" 0 " " *?? \0 " " a \0 "
" 1 " " *?? \0 " " ab \0 "
" 1 " " *?? \0 " " abc \0 "
" 1 " " *?? \0 " " abcd \0 "
" 0 " " ??* \0 " " a \0 "
" 1 " " ??* \0 " " ab \0 "
" 1 " " ??* \0 " " abc \0 "
" 1 " " ??* \0 " " abcd \0 "
" 0 " " ?*? \0 " " a \0 "
" 1 " " ?*? \0 " " ab \0 "
" 1 " " ?*? \0 " " abc \0 "
" 1 " " ?*? \0 " " abcd \0 "
" 1 " " *b \0 " " b \0 "
" 1 " " *b \0 " " ab \0 "
" 0 " " *b \0 " " ba \0 "
" 1 " " *b \0 " " bb \0 "
" 1 " " *b \0 " " abb \0 "
" 1 " " *b \0 " " bab \0 "
" 1 " " *bc \0 " " abbc \0 "
" 1 " " *bc \0 " " bc \0 "
" 1 " " *bc \0 " " bbc \0 "
" 1 " " *bc \0 " " bcbc \0 "
/* Multiple asterisks (complex backtracking) */
" 1 " " *ac* \0 " " abacadaeafag \0 "
" 1 " " *ac*ae*ag* \0 " " abacadaeafag \0 "
" 1 " " *a*b*[bc]*[ef]*g* \0 " " abacadaeafag \0 "
" 0 " " *a*b*[ef]*[cd]*g* \0 " " abacadaeafag \0 "
" 1 " " *abcd* \0 " " abcabcabcabcdefg \0 "
" 1 " " *ab*cd* \0 " " abcabcabcabcdefg \0 "
" 1 " " *abcd*abcdef* \0 " " abcabcdabcdeabcdefg \0 "
" 0 " " *abcd* \0 " " abcabcabcabcefg \0 "
" 0 " " *ab*cd* \0 " " abcabcabcabcefg \0 " ;
static int __init glob_init ( void )
{
unsigned successes = 0 ;
unsigned n = 0 ;
char const * p = glob_tests ;
static char const message [ ] __initconst =
KERN_INFO " glob: %u self-tests passed, %u failed \n " ;
/*
* Tests are jammed together in a string . The first byte is ' 1 '
* or ' 0 ' to indicate the expected outcome , or ' \0 ' to indicate the
* end of the tests . Then come two null - terminated strings : the
* pattern and the string to match it against .
*/
while ( * p ) {
bool expected = * p + + & 1 ;
char const * pat = p ;
p + = strlen ( p ) + 1 ;
successes + = test ( pat , p , expected ) ;
p + = strlen ( p ) + 1 ;
n + + ;
}
n - = successes ;
printk ( message , successes , n ) ;
/* What's the errno for "kernel bug detected"? Guess... */
return n ? - ECANCELED : 0 ;
}
/* We need a dummy exit function to allow unload */
static void __exit glob_fini ( void ) { }
module_init ( glob_init ) ;
module_exit ( glob_fini ) ;
# endif /* CONFIG_GLOB_SELFTEST */