2005-06-23 20:49:30 -07:00
/*
* lib / textsearch . c Generic text search interface
*
* This program is free software ; you can redistribute it and / or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation ; either version
* 2 of the License , or ( at your option ) any later version .
*
* Authors : Thomas Graf < tgraf @ suug . ch >
2007-12-01 00:03:52 +11:00
* Pablo Neira Ayuso < pablo @ netfilter . org >
2005-06-23 20:49:30 -07:00
*
* = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = =
*
* INTRODUCTION
*
* The textsearch infrastructure provides text searching facitilies for
* both linear and non - linear data . Individual search algorithms are
* implemented in modules and chosen by the user .
*
* ARCHITECTURE
*
* User
* + - - - - - - - - - - - - - - - - +
* | finish ( ) | < - - - - - - - - - - - - - - ( 6 ) - - - - - - - - - - - - - - - - - +
* | get_next_block ( ) | < - - - - - - - - - - - - - - ( 5 ) - - - - - - - - - - - - - - - + |
* | | Algorithm | |
* | | + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - +
* | | | init ( ) find ( ) destroy ( ) |
* | | + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - +
* | | Core API ^ ^ ^
* | | + - - - - - - - - - - - - - - - + ( 2 ) ( 4 ) ( 8 )
* | ( 1 ) | - - - - - > | prepare ( ) | - - - + | |
* | ( 3 ) | - - - - - > | find ( ) / next ( ) | - - - - - - - - - - - + |
* | ( 7 ) | - - - - - > | destroy ( ) | - - - - - - - - - - - - - - - - - - - - - - +
* + - - - - - - - - - - - - - - - - + + - - - - - - - - - - - - - - - +
*
* ( 1 ) User configures a search by calling _prepare ( ) specifying the
* search parameters such as the pattern and algorithm name .
* ( 2 ) Core requests the algorithm to allocate and initialize a search
* configuration according to the specified parameters .
* ( 3 ) User starts the search ( es ) by calling _find ( ) or _next ( ) to
* fetch subsequent occurrences . A state variable is provided
2007-02-17 19:07:33 +01:00
* to the algorithm to store persistent variables .
2005-06-23 20:49:30 -07:00
* ( 4 ) Core eventually resets the search offset and forwards the find ( )
* request to the algorithm .
* ( 5 ) Algorithm calls get_next_block ( ) provided by the user continously
* to fetch the data to be searched in block by block .
* ( 6 ) Algorithm invokes finish ( ) after the last call to get_next_block
* to clean up any leftovers from get_next_block . ( Optional )
* ( 7 ) User destroys the configuration by calling _destroy ( ) .
* ( 8 ) Core notifies the algorithm to destroy algorithm specific
* allocations . ( Optional )
*
* USAGE
*
* Before a search can be performed , a configuration must be created
2008-07-08 02:37:31 -07:00
* by calling textsearch_prepare ( ) specifying the searching algorithm ,
* the pattern to look for and flags . As a flag , you can set TS_IGNORECASE
* to perform case insensitive matching . But it might slow down
* performance of algorithm , so you should use it at own your risk .
* The returned configuration may then be used for an arbitary
* amount of times and even in parallel as long as a separate struct
* ts_state variable is provided to every instance .
2005-06-23 20:49:30 -07:00
*
* The actual search is performed by either calling textsearch_find_ -
* continuous ( ) for linear data or by providing an own get_next_block ( )
* implementation and calling textsearch_find ( ) . Both functions return
* the position of the first occurrence of the patern or UINT_MAX if
* no match was found . Subsequent occurences can be found by calling
* textsearch_next ( ) regardless of the linearity of the data .
*
* Once you ' re done using a configuration it must be given back via
* textsearch_destroy .
*
* EXAMPLE
*
* int pos ;
* struct ts_config * conf ;
* struct ts_state state ;
* const char * pattern = " chicken " ;
* const char * example = " We dance the funky chicken " ;
*
* conf = textsearch_prepare ( " kmp " , pattern , strlen ( pattern ) ,
* GFP_KERNEL , TS_AUTOLOAD ) ;
* if ( IS_ERR ( conf ) ) {
* err = PTR_ERR ( conf ) ;
* goto errout ;
* }
*
* pos = textsearch_find_continuous ( conf , & state , example , strlen ( example ) ) ;
* if ( pos ! = UINT_MAX )
* panic ( " Oh my god, dancing chickens at %d \n " , pos ) ;
*
* textsearch_destroy ( conf ) ;
* = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = = =
*/
# include <linux/module.h>
# include <linux/types.h>
# include <linux/string.h>
# include <linux/init.h>
2008-05-12 21:21:05 +02:00
# include <linux/rculist.h>
2005-06-23 20:49:30 -07:00
# include <linux/rcupdate.h>
# include <linux/err.h>
# include <linux/textsearch.h>
static LIST_HEAD ( ts_ops ) ;
static DEFINE_SPINLOCK ( ts_mod_lock ) ;
static inline struct ts_ops * lookup_ts_algo ( const char * name )
{
struct ts_ops * o ;
rcu_read_lock ( ) ;
list_for_each_entry_rcu ( o , & ts_ops , list ) {
if ( ! strcmp ( name , o - > name ) ) {
if ( ! try_module_get ( o - > owner ) )
o = NULL ;
rcu_read_unlock ( ) ;
return o ;
}
}
rcu_read_unlock ( ) ;
return NULL ;
}
/**
* textsearch_register - register a textsearch module
* @ ops : operations lookup table
*
* This function must be called by textsearch modules to announce
* their presence . The specified & @ ops must have % name set to a
* unique identifier and the callbacks find ( ) , init ( ) , get_pattern ( ) ,
* and get_pattern_len ( ) must be implemented .
*
* Returns 0 or - EEXISTS if another module has already registered
* with same name .
*/
int textsearch_register ( struct ts_ops * ops )
{
int err = - EEXIST ;
struct ts_ops * o ;
if ( ops - > name = = NULL | | ops - > find = = NULL | | ops - > init = = NULL | |
ops - > get_pattern = = NULL | | ops - > get_pattern_len = = NULL )
return - EINVAL ;
spin_lock ( & ts_mod_lock ) ;
list_for_each_entry ( o , & ts_ops , list ) {
if ( ! strcmp ( ops - > name , o - > name ) )
goto errout ;
}
list_add_tail_rcu ( & ops - > list , & ts_ops ) ;
err = 0 ;
errout :
spin_unlock ( & ts_mod_lock ) ;
return err ;
}
/**
* textsearch_unregister - unregister a textsearch module
* @ ops : operations lookup table
*
* This function must be called by textsearch modules to announce
* their disappearance for examples when the module gets unloaded .
* The & ops parameter must be the same as the one during the
* registration .
*
* Returns 0 on success or - ENOENT if no matching textsearch
* registration was found .
*/
int textsearch_unregister ( struct ts_ops * ops )
{
int err = 0 ;
struct ts_ops * o ;
spin_lock ( & ts_mod_lock ) ;
list_for_each_entry ( o , & ts_ops , list ) {
if ( o = = ops ) {
list_del_rcu ( & o - > list ) ;
goto out ;
}
}
err = - ENOENT ;
out :
spin_unlock ( & ts_mod_lock ) ;
return err ;
}
struct ts_linear_state
{
unsigned int len ;
const void * data ;
} ;
static unsigned int get_linear_data ( unsigned int consumed , const u8 * * dst ,
struct ts_config * conf ,
struct ts_state * state )
{
struct ts_linear_state * st = ( struct ts_linear_state * ) state - > cb ;
if ( likely ( consumed < st - > len ) ) {
* dst = st - > data + consumed ;
return st - > len - consumed ;
}
return 0 ;
}
/**
* textsearch_find_continuous - search a pattern in continuous / linear data
* @ conf : search configuration
* @ state : search state
* @ data : data to search in
* @ len : length of data
*
* A simplified version of textsearch_find ( ) for continuous / linear data .
* Call textsearch_next ( ) to retrieve subsequent matches .
*
* Returns the position of first occurrence of the pattern or
2007-02-10 01:45:59 -08:00
* % UINT_MAX if no occurrence was found .
2005-06-23 20:49:30 -07:00
*/
unsigned int textsearch_find_continuous ( struct ts_config * conf ,
struct ts_state * state ,
const void * data , unsigned int len )
{
struct ts_linear_state * st = ( struct ts_linear_state * ) state - > cb ;
conf - > get_next_block = get_linear_data ;
st - > data = data ;
st - > len = len ;
return textsearch_find ( conf , state ) ;
}
/**
* textsearch_prepare - Prepare a search
* @ algo : name of search algorithm
* @ pattern : pattern data
* @ len : length of pattern
* @ gfp_mask : allocation mask
* @ flags : search flags
*
* Looks up the search algorithm module and creates a new textsearch
* configuration for the specified pattern . Upon completion all
* necessary refcnts are held and the configuration must be put back
* using textsearch_put ( ) after usage .
*
* Note : The format of the pattern may not be compatible between
* the various search algorithms .
*
* Returns a new textsearch configuration according to the specified
2007-12-01 00:03:52 +11:00
* parameters or a ERR_PTR ( ) . If a zero length pattern is passed , this
* function returns EINVAL .
2005-06-23 20:49:30 -07:00
*/
struct ts_config * textsearch_prepare ( const char * algo , const void * pattern ,
2005-10-21 03:18:50 -04:00
unsigned int len , gfp_t gfp_mask , int flags )
2005-06-23 20:49:30 -07:00
{
int err = - ENOENT ;
struct ts_config * conf ;
struct ts_ops * ops ;
2007-12-01 00:03:52 +11:00
if ( len = = 0 )
return ERR_PTR ( - EINVAL ) ;
2005-06-23 20:49:30 -07:00
ops = lookup_ts_algo ( algo ) ;
2008-07-08 19:00:24 +02:00
# ifdef CONFIG_MODULES
2005-06-23 20:49:30 -07:00
/*
* Why not always autoload you may ask . Some users are
* in a situation where requesting a module may deadlock ,
* especially when the module is located on a NFS mount .
*/
if ( ops = = NULL & & flags & TS_AUTOLOAD ) {
request_module ( " ts_%s " , algo ) ;
ops = lookup_ts_algo ( algo ) ;
}
# endif
if ( ops = = NULL )
goto errout ;
2008-07-08 02:37:31 -07:00
conf = ops - > init ( pattern , len , gfp_mask , flags ) ;
2005-06-23 20:49:30 -07:00
if ( IS_ERR ( conf ) ) {
err = PTR_ERR ( conf ) ;
goto errout ;
}
conf - > ops = ops ;
return conf ;
errout :
if ( ops )
module_put ( ops - > owner ) ;
return ERR_PTR ( err ) ;
}
/**
* textsearch_destroy - destroy a search configuration
* @ conf : search configuration
*
* Releases all references of the configuration and frees
* up the memory .
*/
void textsearch_destroy ( struct ts_config * conf )
{
if ( conf - > ops ) {
if ( conf - > ops - > destroy )
conf - > ops - > destroy ( conf ) ;
module_put ( conf - > ops - > owner ) ;
}
kfree ( conf ) ;
}
EXPORT_SYMBOL ( textsearch_register ) ;
EXPORT_SYMBOL ( textsearch_unregister ) ;
EXPORT_SYMBOL ( textsearch_prepare ) ;
EXPORT_SYMBOL ( textsearch_find_continuous ) ;
EXPORT_SYMBOL ( textsearch_destroy ) ;