2019-06-04 11:11:15 +03:00
// SPDX-License-Identifier: GPL-2.0-only
2011-05-26 20:01:36 +04:00
/*
* Cleancache frontend
*
* This code provides the generic " frontend " layer to call a matching
* " backend " driver implementation of cleancache . See
2018-03-21 22:22:47 +03:00
* Documentation / vm / cleancache . rst for more information .
2011-05-26 20:01:36 +04:00
*
* Copyright ( C ) 2009 - 2010 Oracle Corp . All rights reserved .
* Author : Dan Magenheimer
*/
# include <linux/module.h>
# include <linux/fs.h>
# include <linux/exportfs.h>
# include <linux/mm.h>
2011-09-21 20:28:04 +04:00
# include <linux/debugfs.h>
2011-05-26 20:01:36 +04:00
# include <linux/cleancache.h>
/*
2015-04-15 01:46:48 +03:00
* cleancache_ops is set by cleancache_register_ops to contain the pointers
2011-05-26 20:01:36 +04:00
* to the cleancache " backend " implementation functions .
*/
2016-01-21 18:47:29 +03:00
static const struct cleancache_ops * cleancache_ops __read_mostly ;
2011-05-26 20:01:36 +04:00
2011-09-21 20:28:04 +04:00
/*
2015-01-07 13:14:41 +03:00
* Counters available via / sys / kernel / debug / cleancache ( if debugfs is
2011-09-21 20:28:04 +04:00
* properly configured . These are for information only so are not protected
* against increment races .
*/
static u64 cleancache_succ_gets ;
static u64 cleancache_failed_gets ;
static u64 cleancache_puts ;
static u64 cleancache_invalidates ;
2011-05-26 20:01:36 +04:00
2015-04-15 01:46:48 +03:00
static void cleancache_register_ops_sb ( struct super_block * sb , void * unused )
{
switch ( sb - > cleancache_poolid ) {
case CLEANCACHE_NO_BACKEND :
__cleancache_init_fs ( sb ) ;
break ;
case CLEANCACHE_NO_BACKEND_SHARED :
__cleancache_init_shared_fs ( sb ) ;
break ;
}
}
2013-05-01 02:26:56 +04:00
/*
cleancache: forbid overriding cleancache_ops
Currently, cleancache_register_ops returns the previous value of
cleancache_ops to allow chaining. However, chaining, as it is
implemented now, is extremely dangerous due to possible pool id
collisions. Suppose, a new cleancache driver is registered after the
previous one assigned an id to a super block. If the new driver assigns
the same id to another super block, which is perfectly possible, we will
have two different filesystems using the same id. No matter if the new
driver implements chaining or not, we are likely to get data corruption
with such a configuration eventually.
This patch therefore disables the ability to override cleancache_ops
altogether as potentially dangerous. If there is already cleancache
driver registered, all further calls to cleancache_register_ops will
return EBUSY. Since no user of cleancache implements chaining, we only
need to make minor changes to the code outside the cleancache core.
Signed-off-by: Vladimir Davydov <vdavydov@parallels.com>
Cc: Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
Cc: Boris Ostrovsky <boris.ostrovsky@oracle.com>
Cc: David Vrabel <david.vrabel@citrix.com>
Cc: Mark Fasheh <mfasheh@suse.com>
Cc: Joel Becker <jlbec@evilplan.org>
Cc: Stefan Hengelein <ilendir@googlemail.com>
Cc: Florian Schmaus <fschmaus@gmail.com>
Cc: Andor Daam <andor.daam@googlemail.com>
Cc: Dan Magenheimer <dan.magenheimer@oracle.com>
Cc: Bob Liu <lliubbo@gmail.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2015-04-15 01:46:45 +03:00
* Register operations for cleancache . Returns 0 on success .
2011-05-26 20:01:36 +04:00
*/
2016-01-21 18:47:29 +03:00
int cleancache_register_ops ( const struct cleancache_ops * ops )
2011-05-26 20:01:36 +04:00
{
2015-04-15 01:46:48 +03:00
if ( cmpxchg ( & cleancache_ops , NULL , ops ) )
cleancache: forbid overriding cleancache_ops
Currently, cleancache_register_ops returns the previous value of
cleancache_ops to allow chaining. However, chaining, as it is
implemented now, is extremely dangerous due to possible pool id
collisions. Suppose, a new cleancache driver is registered after the
previous one assigned an id to a super block. If the new driver assigns
the same id to another super block, which is perfectly possible, we will
have two different filesystems using the same id. No matter if the new
driver implements chaining or not, we are likely to get data corruption
with such a configuration eventually.
This patch therefore disables the ability to override cleancache_ops
altogether as potentially dangerous. If there is already cleancache
driver registered, all further calls to cleancache_register_ops will
return EBUSY. Since no user of cleancache implements chaining, we only
need to make minor changes to the code outside the cleancache core.
Signed-off-by: Vladimir Davydov <vdavydov@parallels.com>
Cc: Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
Cc: Boris Ostrovsky <boris.ostrovsky@oracle.com>
Cc: David Vrabel <david.vrabel@citrix.com>
Cc: Mark Fasheh <mfasheh@suse.com>
Cc: Joel Becker <jlbec@evilplan.org>
Cc: Stefan Hengelein <ilendir@googlemail.com>
Cc: Florian Schmaus <fschmaus@gmail.com>
Cc: Andor Daam <andor.daam@googlemail.com>
Cc: Dan Magenheimer <dan.magenheimer@oracle.com>
Cc: Bob Liu <lliubbo@gmail.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2015-04-15 01:46:45 +03:00
return - EBUSY ;
2015-04-15 01:46:48 +03:00
2013-05-01 02:26:57 +04:00
/*
2015-04-15 01:46:48 +03:00
* A cleancache backend can be built as a module and hence loaded after
* a cleancache enabled filesystem has called cleancache_init_fs . To
* handle such a scenario , here we call - > init_fs or - > init_shared_fs
* for each active super block . To differentiate between local and
* shared filesystems , we temporarily initialize sb - > cleancache_poolid
* to CLEANCACHE_NO_BACKEND or CLEANCACHE_NO_BACKEND_SHARED
* respectively in case there is no backend registered at the time
* cleancache_init_fs or cleancache_init_shared_fs is called .
*
* Since filesystems can be mounted concurrently with cleancache
* backend registration , we have to be careful to guarantee that all
* cleancache enabled filesystems that has been mounted by the time
* cleancache_register_ops is called has got and all mounted later will
* get cleancache_poolid . This is assured by the following statements
* tied together :
*
* a ) iterate_supers skips only those super blocks that has started
* - > kill_sb
*
* b ) if iterate_supers encounters a super block that has not finished
* - > mount yet , it waits until it is finished
*
* c ) cleancache_init_fs is called from - > mount and
* cleancache_invalidate_fs is called from - > kill_sb
*
* d ) we call iterate_supers after cleancache_ops has been set
*
* From a ) it follows that if iterate_supers skips a super block , then
* either the super block is already dead , in which case we do not need
* to bother initializing cleancache for it , or it was mounted after we
* initiated iterate_supers . In the latter case , it must have seen
* cleancache_ops set according to d ) and initialized cleancache from
* - > mount by itself according to c ) . This proves that we call
* - > init_fs at least once for each active super block .
*
* From b ) and c ) it follows that if iterate_supers encounters a super
* block that has already started - > init_fs , it will wait until - > mount
* and hence - > init_fs has finished , then check cleancache_poolid , see
* that it has already been set and therefore do nothing . This proves
* that we call - > init_fs no more than once for each super block .
*
* Combined together , the last two paragraphs prove the function
* correctness .
*
* Note that various cleancache callbacks may proceed before this
* function is called or even concurrently with it , but since
* CLEANCACHE_NO_BACKEND is negative , they will all result in a noop
* until the corresponding - > init_fs has been actually called and
* cleancache_ops has been set .
2013-05-01 02:26:57 +04:00
*/
2015-04-15 01:46:48 +03:00
iterate_supers ( cleancache_register_ops_sb , NULL ) ;
cleancache: forbid overriding cleancache_ops
Currently, cleancache_register_ops returns the previous value of
cleancache_ops to allow chaining. However, chaining, as it is
implemented now, is extremely dangerous due to possible pool id
collisions. Suppose, a new cleancache driver is registered after the
previous one assigned an id to a super block. If the new driver assigns
the same id to another super block, which is perfectly possible, we will
have two different filesystems using the same id. No matter if the new
driver implements chaining or not, we are likely to get data corruption
with such a configuration eventually.
This patch therefore disables the ability to override cleancache_ops
altogether as potentially dangerous. If there is already cleancache
driver registered, all further calls to cleancache_register_ops will
return EBUSY. Since no user of cleancache implements chaining, we only
need to make minor changes to the code outside the cleancache core.
Signed-off-by: Vladimir Davydov <vdavydov@parallels.com>
Cc: Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
Cc: Boris Ostrovsky <boris.ostrovsky@oracle.com>
Cc: David Vrabel <david.vrabel@citrix.com>
Cc: Mark Fasheh <mfasheh@suse.com>
Cc: Joel Becker <jlbec@evilplan.org>
Cc: Stefan Hengelein <ilendir@googlemail.com>
Cc: Florian Schmaus <fschmaus@gmail.com>
Cc: Andor Daam <andor.daam@googlemail.com>
Cc: Dan Magenheimer <dan.magenheimer@oracle.com>
Cc: Bob Liu <lliubbo@gmail.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2015-04-15 01:46:45 +03:00
return 0 ;
2011-05-26 20:01:36 +04:00
}
EXPORT_SYMBOL ( cleancache_register_ops ) ;
/* Called by a cleancache-enabled filesystem at time of mount */
void __cleancache_init_fs ( struct super_block * sb )
{
2015-04-15 01:46:48 +03:00
int pool_id = CLEANCACHE_NO_BACKEND ;
2013-05-01 02:26:56 +04:00
2015-04-15 01:46:48 +03:00
if ( cleancache_ops ) {
pool_id = cleancache_ops - > init_fs ( PAGE_SIZE ) ;
if ( pool_id < 0 )
pool_id = CLEANCACHE_NO_POOL ;
2013-05-01 02:26:56 +04:00
}
2015-04-15 01:46:48 +03:00
sb - > cleancache_poolid = pool_id ;
2011-05-26 20:01:36 +04:00
}
EXPORT_SYMBOL ( __cleancache_init_fs ) ;
/* Called by a cleancache-enabled clustered filesystem at time of mount */
2015-04-15 01:46:42 +03:00
void __cleancache_init_shared_fs ( struct super_block * sb )
2011-05-26 20:01:36 +04:00
{
2015-04-15 01:46:48 +03:00
int pool_id = CLEANCACHE_NO_BACKEND_SHARED ;
2013-05-01 02:26:56 +04:00
2015-04-15 01:46:48 +03:00
if ( cleancache_ops ) {
2017-05-10 16:06:33 +03:00
pool_id = cleancache_ops - > init_shared_fs ( & sb - > s_uuid , PAGE_SIZE ) ;
2015-04-15 01:46:48 +03:00
if ( pool_id < 0 )
pool_id = CLEANCACHE_NO_POOL ;
2013-05-01 02:26:56 +04:00
}
2015-04-15 01:46:48 +03:00
sb - > cleancache_poolid = pool_id ;
2011-05-26 20:01:36 +04:00
}
EXPORT_SYMBOL ( __cleancache_init_shared_fs ) ;
/*
* If the filesystem uses exportable filehandles , use the filehandle as
* the key , else use the inode number .
*/
static int cleancache_get_key ( struct inode * inode ,
struct cleancache_filekey * key )
{
2012-04-02 22:34:06 +04:00
int ( * fhfn ) ( struct inode * , __u32 * fh , int * , struct inode * ) ;
2011-05-26 20:01:36 +04:00
int len = 0 , maxlen = CLEANCACHE_KEY_MAX ;
struct super_block * sb = inode - > i_sb ;
key - > u . ino = inode - > i_ino ;
if ( sb - > s_export_op ! = NULL ) {
fhfn = sb - > s_export_op - > encode_fh ;
if ( fhfn ) {
2012-04-02 22:34:06 +04:00
len = ( * fhfn ) ( inode , & key - > u . fh [ 0 ] , & maxlen , NULL ) ;
2013-02-17 10:48:11 +04:00
if ( len < = FILEID_ROOT | | len = = FILEID_INVALID )
2011-05-26 20:01:36 +04:00
return - 1 ;
if ( maxlen > CLEANCACHE_KEY_MAX )
return - 1 ;
}
}
return 0 ;
}
/*
* " Get " data from cleancache associated with the poolid / inode / index
* that were specified when the data was put to cleanache and , if
* successful , use it to fill the specified page with data and return 0.
* The pageframe is unchanged and returns - 1 if the get fails .
* Page must be locked by caller .
2013-05-01 02:26:56 +04:00
*
* The function has two checks before any action is taken - whether
* a backend is registered and whether the sb - > cleancache_poolid
* is correct .
2011-05-26 20:01:36 +04:00
*/
int __cleancache_get_page ( struct page * page )
{
int ret = - 1 ;
int pool_id ;
struct cleancache_filekey key = { . u . key = { 0 } } ;
2013-05-01 02:26:57 +04:00
if ( ! cleancache_ops ) {
2013-05-01 02:26:56 +04:00
cleancache_failed_gets + + ;
goto out ;
}
2014-01-24 03:52:54 +04:00
VM_BUG_ON_PAGE ( ! PageLocked ( page ) , page ) ;
2015-04-15 01:46:48 +03:00
pool_id = page - > mapping - > host - > i_sb - > cleancache_poolid ;
if ( pool_id < 0 )
2011-05-26 20:01:36 +04:00
goto out ;
if ( cleancache_get_key ( page - > mapping - > host , & key ) < 0 )
goto out ;
2015-04-15 01:46:48 +03:00
ret = cleancache_ops - > get_page ( pool_id , key , page - > index , page ) ;
2011-05-26 20:01:36 +04:00
if ( ret = = 0 )
cleancache_succ_gets + + ;
else
cleancache_failed_gets + + ;
out :
return ret ;
}
EXPORT_SYMBOL ( __cleancache_get_page ) ;
/*
* " Put " data from a page to cleancache and associate it with the
* ( previously - obtained per - filesystem ) poolid and the page ' s ,
* inode and page index . Page must be locked . Note that a put_page
* always " succeeds " , though a subsequent get_page may succeed or fail .
2013-05-01 02:26:56 +04:00
*
* The function has two checks before any action is taken - whether
* a backend is registered and whether the sb - > cleancache_poolid
* is correct .
2011-05-26 20:01:36 +04:00
*/
void __cleancache_put_page ( struct page * page )
{
int pool_id ;
struct cleancache_filekey key = { . u . key = { 0 } } ;
2013-05-01 02:26:57 +04:00
if ( ! cleancache_ops ) {
2013-05-01 02:26:56 +04:00
cleancache_puts + + ;
return ;
}
2014-01-24 03:52:54 +04:00
VM_BUG_ON_PAGE ( ! PageLocked ( page ) , page ) ;
2015-04-15 01:46:48 +03:00
pool_id = page - > mapping - > host - > i_sb - > cleancache_poolid ;
2011-05-26 20:01:36 +04:00
if ( pool_id > = 0 & &
2013-05-01 02:26:56 +04:00
cleancache_get_key ( page - > mapping - > host , & key ) > = 0 ) {
2013-05-01 02:26:57 +04:00
cleancache_ops - > put_page ( pool_id , key , page - > index , page ) ;
2011-05-26 20:01:36 +04:00
cleancache_puts + + ;
}
}
EXPORT_SYMBOL ( __cleancache_put_page ) ;
/*
2011-09-21 19:56:28 +04:00
* Invalidate any data from cleancache associated with the poolid and the
2011-05-26 20:01:36 +04:00
* page ' s inode and page index so that a subsequent " get " will fail .
2013-05-01 02:26:56 +04:00
*
* The function has two checks before any action is taken - whether
* a backend is registered and whether the sb - > cleancache_poolid
* is correct .
2011-05-26 20:01:36 +04:00
*/
2011-09-21 19:56:28 +04:00
void __cleancache_invalidate_page ( struct address_space * mapping ,
struct page * page )
2011-05-26 20:01:36 +04:00
{
/* careful... page->mapping is NULL sometimes when this is called */
2015-04-15 01:46:48 +03:00
int pool_id = mapping - > host - > i_sb - > cleancache_poolid ;
2011-05-26 20:01:36 +04:00
struct cleancache_filekey key = { . u . key = { 0 } } ;
2013-05-01 02:26:57 +04:00
if ( ! cleancache_ops )
2013-05-01 02:26:56 +04:00
return ;
2015-04-15 01:46:48 +03:00
if ( pool_id > = 0 ) {
2014-01-24 03:52:54 +04:00
VM_BUG_ON_PAGE ( ! PageLocked ( page ) , page ) ;
2011-05-26 20:01:36 +04:00
if ( cleancache_get_key ( mapping - > host , & key ) > = 0 ) {
2013-05-01 02:26:57 +04:00
cleancache_ops - > invalidate_page ( pool_id ,
2013-05-01 02:26:56 +04:00
key , page - > index ) ;
2011-09-21 20:28:04 +04:00
cleancache_invalidates + + ;
2011-05-26 20:01:36 +04:00
}
}
}
2011-09-21 19:56:28 +04:00
EXPORT_SYMBOL ( __cleancache_invalidate_page ) ;
2011-05-26 20:01:36 +04:00
/*
2011-09-21 19:56:28 +04:00
* Invalidate all data from cleancache associated with the poolid and the
2011-05-26 20:01:36 +04:00
* mappings ' s inode so that all subsequent gets to this poolid / inode
* will fail .
2013-05-01 02:26:56 +04:00
*
* The function has two checks before any action is taken - whether
* a backend is registered and whether the sb - > cleancache_poolid
* is correct .
2011-05-26 20:01:36 +04:00
*/
2011-09-21 19:56:28 +04:00
void __cleancache_invalidate_inode ( struct address_space * mapping )
2011-05-26 20:01:36 +04:00
{
2015-04-15 01:46:48 +03:00
int pool_id = mapping - > host - > i_sb - > cleancache_poolid ;
2011-05-26 20:01:36 +04:00
struct cleancache_filekey key = { . u . key = { 0 } } ;
2013-05-01 02:26:57 +04:00
if ( ! cleancache_ops )
2013-05-01 02:26:56 +04:00
return ;
2011-05-26 20:01:36 +04:00
if ( pool_id > = 0 & & cleancache_get_key ( mapping - > host , & key ) > = 0 )
2013-05-01 02:26:57 +04:00
cleancache_ops - > invalidate_inode ( pool_id , key ) ;
2011-05-26 20:01:36 +04:00
}
2011-09-21 19:56:28 +04:00
EXPORT_SYMBOL ( __cleancache_invalidate_inode ) ;
2011-05-26 20:01:36 +04:00
/*
* Called by any cleancache - enabled filesystem at time of unmount ;
2013-05-01 02:26:56 +04:00
* note that pool_id is surrendered and may be returned by a subsequent
* cleancache_init_fs or cleancache_init_shared_fs .
2011-05-26 20:01:36 +04:00
*/
2011-09-21 19:56:28 +04:00
void __cleancache_invalidate_fs ( struct super_block * sb )
2011-05-26 20:01:36 +04:00
{
2015-04-15 01:46:48 +03:00
int pool_id ;
2013-05-01 02:26:56 +04:00
2015-04-15 01:46:48 +03:00
pool_id = sb - > cleancache_poolid ;
sb - > cleancache_poolid = CLEANCACHE_NO_POOL ;
if ( cleancache_ops & & pool_id > = 0 )
cleancache_ops - > invalidate_fs ( pool_id ) ;
2011-05-26 20:01:36 +04:00
}
2011-09-21 19:56:28 +04:00
EXPORT_SYMBOL ( __cleancache_invalidate_fs ) ;
2011-05-26 20:01:36 +04:00
static int __init init_cleancache ( void )
{
2011-09-21 20:28:04 +04:00
# ifdef CONFIG_DEBUG_FS
struct dentry * root = debugfs_create_dir ( " cleancache " , NULL ) ;
2019-01-22 18:21:11 +03:00
2018-06-15 01:27:58 +03:00
debugfs_create_u64 ( " succ_gets " , 0444 , root , & cleancache_succ_gets ) ;
debugfs_create_u64 ( " failed_gets " , 0444 , root , & cleancache_failed_gets ) ;
debugfs_create_u64 ( " puts " , 0444 , root , & cleancache_puts ) ;
debugfs_create_u64 ( " invalidates " , 0444 , root , & cleancache_invalidates ) ;
2011-09-21 20:28:04 +04:00
# endif
2011-05-26 20:01:36 +04:00
return 0 ;
}
module_init ( init_cleancache )