2005-04-16 15:20:36 -07:00
/*
* file . c - operations for regular ( text ) files .
*/
# include <linux/module.h>
[PATCH] inotify
inotify is intended to correct the deficiencies of dnotify, particularly
its inability to scale and its terrible user interface:
* dnotify requires the opening of one fd per each directory
that you intend to watch. This quickly results in too many
open files and pins removable media, preventing unmount.
* dnotify is directory-based. You only learn about changes to
directories. Sure, a change to a file in a directory affects
the directory, but you are then forced to keep a cache of
stat structures.
* dnotify's interface to user-space is awful. Signals?
inotify provides a more usable, simple, powerful solution to file change
notification:
* inotify's interface is a system call that returns a fd, not SIGIO.
You get a single fd, which is select()-able.
* inotify has an event that says "the filesystem that the item
you were watching is on was unmounted."
* inotify can watch directories or files.
Inotify is currently used by Beagle (a desktop search infrastructure),
Gamin (a FAM replacement), and other projects.
See Documentation/filesystems/inotify.txt.
Signed-off-by: Robert Love <rml@novell.com>
Cc: John McCutchan <ttb@tentacle.dhs.org>
Cc: Christoph Hellwig <hch@lst.de>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2005-07-12 17:06:03 -04:00
# include <linux/fsnotify.h>
2005-04-16 15:20:36 -07:00
# include <linux/kobject.h>
2005-06-23 00:09:12 -07:00
# include <linux/namei.h>
2006-03-20 17:53:53 +11:00
# include <linux/poll.h>
2005-04-16 15:20:36 -07:00
# include <asm/uaccess.h>
# include <asm/semaphore.h>
# include "sysfs.h"
# define to_subsys(k) container_of(k,struct subsystem,kset.kobj)
# define to_sattr(a) container_of(a,struct subsys_attribute,attr)
2005-06-23 22:05:21 -07:00
/*
2005-04-16 15:20:36 -07:00
* Subsystem file operations .
* These operations allow subsystems to have files that can be
* read / written .
*/
static ssize_t
subsys_attr_show ( struct kobject * kobj , struct attribute * attr , char * page )
{
struct subsystem * s = to_subsys ( kobj ) ;
struct subsys_attribute * sattr = to_sattr ( attr ) ;
2005-04-29 01:22:00 -05:00
ssize_t ret = - EIO ;
2005-04-16 15:20:36 -07:00
if ( sattr - > show )
ret = sattr - > show ( s , page ) ;
return ret ;
}
static ssize_t
subsys_attr_store ( struct kobject * kobj , struct attribute * attr ,
const char * page , size_t count )
{
struct subsystem * s = to_subsys ( kobj ) ;
struct subsys_attribute * sattr = to_sattr ( attr ) ;
2005-04-29 01:22:00 -05:00
ssize_t ret = - EIO ;
2005-04-16 15:20:36 -07:00
if ( sattr - > store )
ret = sattr - > store ( s , page , count ) ;
return ret ;
}
static struct sysfs_ops subsys_sysfs_ops = {
. show = subsys_attr_show ,
. store = subsys_attr_store ,
} ;
struct sysfs_buffer {
size_t count ;
loff_t pos ;
char * page ;
struct sysfs_ops * ops ;
struct semaphore sem ;
int needs_read_fill ;
2006-03-20 17:53:53 +11:00
int event ;
2005-04-16 15:20:36 -07:00
} ;
/**
* fill_read_buffer - allocate and fill buffer from object .
* @ dentry : dentry pointer .
* @ buffer : data buffer for file .
*
* Allocate @ buffer - > page , if it hasn ' t been already , then call the
* kobject ' s show ( ) method to fill the buffer with this attribute ' s
* data .
* This is called only once , on the file ' s first read .
*/
static int fill_read_buffer ( struct dentry * dentry , struct sysfs_buffer * buffer )
{
2006-03-20 17:53:53 +11:00
struct sysfs_dirent * sd = dentry - > d_fsdata ;
2005-04-16 15:20:36 -07:00
struct attribute * attr = to_attr ( dentry ) ;
struct kobject * kobj = to_kobj ( dentry - > d_parent ) ;
struct sysfs_ops * ops = buffer - > ops ;
int ret = 0 ;
ssize_t count ;
if ( ! buffer - > page )
buffer - > page = ( char * ) get_zeroed_page ( GFP_KERNEL ) ;
if ( ! buffer - > page )
return - ENOMEM ;
2006-03-20 17:53:53 +11:00
buffer - > event = atomic_read ( & sd - > s_event ) ;
2005-04-16 15:20:36 -07:00
count = ops - > show ( kobj , attr , buffer - > page ) ;
buffer - > needs_read_fill = 0 ;
BUG_ON ( count > ( ssize_t ) PAGE_SIZE ) ;
if ( count > = 0 )
buffer - > count = count ;
else
ret = count ;
return ret ;
}
/**
* flush_read_buffer - push buffer to userspace .
* @ buffer : data buffer for file .
2005-05-01 08:59:26 -07:00
* @ buf : user - passed buffer .
2005-04-16 15:20:36 -07:00
* @ count : number of bytes requested .
* @ ppos : file position .
*
* Copy the buffer we filled in fill_read_buffer ( ) to userspace .
* This is done at the reader ' s leisure , copying and advancing
* the amount they specify each time .
* This may be called continuously until the buffer is empty .
*/
static int flush_read_buffer ( struct sysfs_buffer * buffer , char __user * buf ,
size_t count , loff_t * ppos )
{
int error ;
if ( * ppos > buffer - > count )
return 0 ;
if ( count > ( buffer - > count - * ppos ) )
count = buffer - > count - * ppos ;
error = copy_to_user ( buf , buffer - > page + * ppos , count ) ;
if ( ! error )
* ppos + = count ;
return error ? - EFAULT : count ;
}
/**
* sysfs_read_file - read an attribute .
* @ file : file pointer .
* @ buf : buffer to fill .
* @ count : number of bytes to read .
* @ ppos : starting offset in file .
*
* Userspace wants to read an attribute file . The attribute descriptor
* is in the file ' s - > d_fsdata . The target object is in the directory ' s
* - > d_fsdata .
*
* We call fill_read_buffer ( ) to allocate and fill the buffer from the
* object ' s show ( ) method exactly once ( if the read is happening from
* the beginning of the file ) . That should fill the entire buffer with
* all the data the object has to offer for that attribute .
* We then call flush_read_buffer ( ) to copy the buffer to userspace
* in the increments specified .
*/
static ssize_t
sysfs_read_file ( struct file * file , char __user * buf , size_t count , loff_t * ppos )
{
struct sysfs_buffer * buffer = file - > private_data ;
ssize_t retval = 0 ;
down ( & buffer - > sem ) ;
if ( buffer - > needs_read_fill ) {
if ( ( retval = fill_read_buffer ( file - > f_dentry , buffer ) ) )
goto out ;
}
2006-10-03 01:16:06 -07:00
pr_debug ( " %s: count = %zd, ppos = %lld, buf = %s \n " ,
__FUNCTION__ , count , * ppos , buffer - > page ) ;
2005-04-16 15:20:36 -07:00
retval = flush_read_buffer ( buffer , buf , count , ppos ) ;
out :
up ( & buffer - > sem ) ;
return retval ;
}
/**
* fill_write_buffer - copy buffer from userspace .
* @ buffer : data buffer for file .
2005-05-01 08:59:26 -07:00
* @ buf : data from user .
2005-04-16 15:20:36 -07:00
* @ count : number of bytes in @ userbuf .
*
* Allocate @ buffer - > page if it hasn ' t been already , then
* copy the user - supplied buffer into it .
*/
static int
fill_write_buffer ( struct sysfs_buffer * buffer , const char __user * buf , size_t count )
{
int error ;
if ( ! buffer - > page )
buffer - > page = ( char * ) get_zeroed_page ( GFP_KERNEL ) ;
if ( ! buffer - > page )
return - ENOMEM ;
if ( count > = PAGE_SIZE )
2006-03-31 15:37:06 -08:00
count = PAGE_SIZE - 1 ;
2005-04-16 15:20:36 -07:00
error = copy_from_user ( buffer - > page , buf , count ) ;
buffer - > needs_read_fill = 1 ;
2006-10-22 19:17:47 +02:00
/* if buf is assumed to contain a string, terminate it by \0,
so e . g . sscanf ( ) can scan the string easily */
buffer - > page [ count ] = 0 ;
2005-04-16 15:20:36 -07:00
return error ? - EFAULT : count ;
}
/**
* flush_write_buffer - push buffer to kobject .
2005-06-23 22:05:21 -07:00
* @ dentry : dentry to the attribute
2005-04-16 15:20:36 -07:00
* @ buffer : data buffer for file .
2005-06-23 22:05:21 -07:00
* @ count : number of bytes
2005-04-16 15:20:36 -07:00
*
* Get the correct pointers for the kobject and the attribute we ' re
* dealing with , then call the store ( ) method for the attribute ,
* passing the buffer that we acquired in fill_write_buffer ( ) .
*/
static int
flush_write_buffer ( struct dentry * dentry , struct sysfs_buffer * buffer , size_t count )
{
struct attribute * attr = to_attr ( dentry ) ;
struct kobject * kobj = to_kobj ( dentry - > d_parent ) ;
struct sysfs_ops * ops = buffer - > ops ;
return ops - > store ( kobj , attr , buffer - > page , count ) ;
}
/**
* sysfs_write_file - write an attribute .
* @ file : file pointer
* @ buf : data to write
* @ count : number of bytes
* @ ppos : starting offset
*
* Similar to sysfs_read_file ( ) , though working in the opposite direction .
* We allocate and fill the data from the user in fill_write_buffer ( ) ,
* then push it to the kobject in flush_write_buffer ( ) .
* There is no easy way for us to know if userspace is only doing a partial
* write , so we don ' t support them . We expect the entire buffer to come
* on the first write .
* Hint : if you ' re writing a value , first read the file , modify only the
* the value you ' re changing , then write entire buffer back .
*/
static ssize_t
sysfs_write_file ( struct file * file , const char __user * buf , size_t count , loff_t * ppos )
{
struct sysfs_buffer * buffer = file - > private_data ;
ssize_t len ;
down ( & buffer - > sem ) ;
len = fill_write_buffer ( buffer , buf , count ) ;
if ( len > 0 )
len = flush_write_buffer ( file - > f_dentry , buffer , len ) ;
if ( len > 0 )
* ppos + = len ;
up ( & buffer - > sem ) ;
return len ;
}
static int check_perm ( struct inode * inode , struct file * file )
{
struct kobject * kobj = sysfs_get_kobject ( file - > f_dentry - > d_parent ) ;
struct attribute * attr = to_attr ( file - > f_dentry ) ;
struct sysfs_buffer * buffer ;
struct sysfs_ops * ops = NULL ;
int error = 0 ;
if ( ! kobj | | ! attr )
goto Einval ;
/* Grab the module reference for this attribute if we have one */
if ( ! try_module_get ( attr - > owner ) ) {
error = - ENODEV ;
goto Done ;
}
/* if the kobject has no ktype, then we assume that it is a subsystem
* itself , and use ops for it .
*/
if ( kobj - > kset & & kobj - > kset - > ktype )
ops = kobj - > kset - > ktype - > sysfs_ops ;
else if ( kobj - > ktype )
ops = kobj - > ktype - > sysfs_ops ;
else
ops = & subsys_sysfs_ops ;
/* No sysfs operations, either from having no subsystem,
* or the subsystem have no operations .
*/
if ( ! ops )
goto Eaccess ;
/* File needs write support.
* The inode ' s perms must say it ' s ok ,
* and we must have a store method .
*/
if ( file - > f_mode & FMODE_WRITE ) {
if ( ! ( inode - > i_mode & S_IWUGO ) | | ! ops - > store )
goto Eaccess ;
}
/* File needs read support.
* The inode ' s perms must say it ' s ok , and we there
* must be a show method for it .
*/
if ( file - > f_mode & FMODE_READ ) {
if ( ! ( inode - > i_mode & S_IRUGO ) | | ! ops - > show )
goto Eaccess ;
}
/* No error? Great, allocate a buffer for the file, and store it
* it in file - > private_data for easy access .
*/
2006-02-22 11:18:15 +01:00
buffer = kzalloc ( sizeof ( struct sysfs_buffer ) , GFP_KERNEL ) ;
2005-04-16 15:20:36 -07:00
if ( buffer ) {
init_MUTEX ( & buffer - > sem ) ;
buffer - > needs_read_fill = 1 ;
buffer - > ops = ops ;
file - > private_data = buffer ;
} else
error = - ENOMEM ;
goto Done ;
Einval :
error = - EINVAL ;
goto Done ;
Eaccess :
error = - EACCES ;
module_put ( attr - > owner ) ;
Done :
if ( error & & kobj )
kobject_put ( kobj ) ;
return error ;
}
static int sysfs_open_file ( struct inode * inode , struct file * filp )
{
return check_perm ( inode , filp ) ;
}
static int sysfs_release ( struct inode * inode , struct file * filp )
{
struct kobject * kobj = to_kobj ( filp - > f_dentry - > d_parent ) ;
struct attribute * attr = to_attr ( filp - > f_dentry ) ;
struct module * owner = attr - > owner ;
struct sysfs_buffer * buffer = filp - > private_data ;
if ( kobj )
kobject_put ( kobj ) ;
/* After this point, attr should not be accessed. */
module_put ( owner ) ;
if ( buffer ) {
if ( buffer - > page )
free_page ( ( unsigned long ) buffer - > page ) ;
kfree ( buffer ) ;
}
return 0 ;
}
2006-03-20 17:53:53 +11:00
/* Sysfs attribute files are pollable. The idea is that you read
* the content and then you use ' poll ' or ' select ' to wait for
* the content to change . When the content changes ( assuming the
* manager for the kobject supports notification ) , poll will
* return POLLERR | POLLPRI , and select will return the fd whether
* it is waiting for read , write , or exceptions .
* Once poll / select indicates that the value has changed , you
* need to close and re - open the file , as simply seeking and reading
* again will not get new data , or reset the state of ' poll ' .
* Reminder : this only works for attributes which actively support
* it , and it is not possible to test an attribute from userspace
* to see if it supports poll ( Nether ' poll ' or ' select ' return
* an appropriate error code ) . When in doubt , set a suitable timeout value .
*/
static unsigned int sysfs_poll ( struct file * filp , poll_table * wait )
{
struct sysfs_buffer * buffer = filp - > private_data ;
struct kobject * kobj = to_kobj ( filp - > f_dentry - > d_parent ) ;
struct sysfs_dirent * sd = filp - > f_dentry - > d_fsdata ;
int res = 0 ;
poll_wait ( filp , & kobj - > poll , wait ) ;
if ( buffer - > event ! = atomic_read ( & sd - > s_event ) ) {
res = POLLERR | POLLPRI ;
buffer - > needs_read_fill = 1 ;
}
return res ;
}
static struct dentry * step_down ( struct dentry * dir , const char * name )
{
struct dentry * de ;
if ( dir = = NULL | | dir - > d_inode = = NULL )
return NULL ;
mutex_lock ( & dir - > d_inode - > i_mutex ) ;
de = lookup_one_len ( name , dir , strlen ( name ) ) ;
mutex_unlock ( & dir - > d_inode - > i_mutex ) ;
dput ( dir ) ;
if ( IS_ERR ( de ) )
return NULL ;
if ( de - > d_inode = = NULL ) {
dput ( de ) ;
return NULL ;
}
return de ;
}
void sysfs_notify ( struct kobject * k , char * dir , char * attr )
{
struct dentry * de = k - > dentry ;
if ( de )
dget ( de ) ;
if ( de & & dir )
de = step_down ( de , dir ) ;
if ( de & & attr )
de = step_down ( de , attr ) ;
if ( de ) {
struct sysfs_dirent * sd = de - > d_fsdata ;
if ( sd )
atomic_inc ( & sd - > s_event ) ;
wake_up_interruptible ( & k - > poll ) ;
dput ( de ) ;
}
}
EXPORT_SYMBOL_GPL ( sysfs_notify ) ;
2006-03-28 01:56:42 -08:00
const struct file_operations sysfs_file_operations = {
2005-04-16 15:20:36 -07:00
. read = sysfs_read_file ,
. write = sysfs_write_file ,
. llseek = generic_file_llseek ,
. open = sysfs_open_file ,
. release = sysfs_release ,
2006-03-20 17:53:53 +11:00
. poll = sysfs_poll ,
2005-04-16 15:20:36 -07:00
} ;
int sysfs_add_file ( struct dentry * dir , const struct attribute * attr , int type )
{
struct sysfs_dirent * parent_sd = dir - > d_fsdata ;
umode_t mode = ( attr - > mode & S_IALLUGO ) | S_IFREG ;
2006-03-09 19:40:14 +05:30
int error = - EEXIST ;
2005-04-16 15:20:36 -07:00
2006-01-09 15:59:24 -08:00
mutex_lock ( & dir - > d_inode - > i_mutex ) ;
2006-03-09 19:40:14 +05:30
if ( ! sysfs_dirent_exist ( parent_sd , attr - > name ) )
error = sysfs_make_dirent ( parent_sd , NULL , ( void * ) attr ,
mode , type ) ;
2006-01-09 15:59:24 -08:00
mutex_unlock ( & dir - > d_inode - > i_mutex ) ;
2005-04-16 15:20:36 -07:00
return error ;
}
/**
* sysfs_create_file - create an attribute file for an object .
* @ kobj : object we ' re creating for .
* @ attr : atrribute descriptor .
*/
int sysfs_create_file ( struct kobject * kobj , const struct attribute * attr )
{
BUG_ON ( ! kobj | | ! kobj - > dentry | | ! attr ) ;
return sysfs_add_file ( kobj - > dentry , attr , SYSFS_KOBJ_ATTR ) ;
}
/**
* sysfs_update_file - update the modified timestamp on an object attribute .
* @ kobj : object we ' re acting for .
* @ attr : attribute descriptor .
*/
int sysfs_update_file ( struct kobject * kobj , const struct attribute * attr )
{
struct dentry * dir = kobj - > dentry ;
struct dentry * victim ;
int res = - ENOENT ;
2006-01-09 15:59:24 -08:00
mutex_lock ( & dir - > d_inode - > i_mutex ) ;
2005-06-23 00:09:12 -07:00
victim = lookup_one_len ( attr - > name , dir , strlen ( attr - > name ) ) ;
2005-04-16 15:20:36 -07:00
if ( ! IS_ERR ( victim ) ) {
/* make sure dentry is really there */
if ( victim - > d_inode & &
( victim - > d_parent - > d_inode = = dir - > d_inode ) ) {
victim - > d_inode - > i_mtime = CURRENT_TIME ;
[PATCH] inotify
inotify is intended to correct the deficiencies of dnotify, particularly
its inability to scale and its terrible user interface:
* dnotify requires the opening of one fd per each directory
that you intend to watch. This quickly results in too many
open files and pins removable media, preventing unmount.
* dnotify is directory-based. You only learn about changes to
directories. Sure, a change to a file in a directory affects
the directory, but you are then forced to keep a cache of
stat structures.
* dnotify's interface to user-space is awful. Signals?
inotify provides a more usable, simple, powerful solution to file change
notification:
* inotify's interface is a system call that returns a fd, not SIGIO.
You get a single fd, which is select()-able.
* inotify has an event that says "the filesystem that the item
you were watching is on was unmounted."
* inotify can watch directories or files.
Inotify is currently used by Beagle (a desktop search infrastructure),
Gamin (a FAM replacement), and other projects.
See Documentation/filesystems/inotify.txt.
Signed-off-by: Robert Love <rml@novell.com>
Cc: John McCutchan <ttb@tentacle.dhs.org>
Cc: Christoph Hellwig <hch@lst.de>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2005-07-12 17:06:03 -04:00
fsnotify_modify ( victim ) ;
2005-04-16 15:20:36 -07:00
res = 0 ;
} else
d_drop ( victim ) ;
/**
2006-09-20 16:49:02 +09:00
* Drop the reference acquired from lookup_one_len ( ) above .
2005-04-16 15:20:36 -07:00
*/
dput ( victim ) ;
}
2006-01-09 15:59:24 -08:00
mutex_unlock ( & dir - > d_inode - > i_mutex ) ;
2005-04-16 15:20:36 -07:00
return res ;
}
2005-04-18 21:57:32 -07:00
/**
* sysfs_chmod_file - update the modified mode value on an object attribute .
* @ kobj : object we ' re acting for .
* @ attr : attribute descriptor .
* @ mode : file permissions .
*
*/
int sysfs_chmod_file ( struct kobject * kobj , struct attribute * attr , mode_t mode )
{
struct dentry * dir = kobj - > dentry ;
struct dentry * victim ;
2005-07-29 12:13:35 -07:00
struct inode * inode ;
struct iattr newattrs ;
2005-04-18 21:57:32 -07:00
int res = - ENOENT ;
2006-01-09 15:59:24 -08:00
mutex_lock ( & dir - > d_inode - > i_mutex ) ;
2005-06-23 00:09:12 -07:00
victim = lookup_one_len ( attr - > name , dir , strlen ( attr - > name ) ) ;
2005-04-18 21:57:32 -07:00
if ( ! IS_ERR ( victim ) ) {
if ( victim - > d_inode & &
( victim - > d_parent - > d_inode = = dir - > d_inode ) ) {
2005-07-29 12:13:35 -07:00
inode = victim - > d_inode ;
2006-01-09 15:59:24 -08:00
mutex_lock ( & inode - > i_mutex ) ;
2005-07-29 12:13:35 -07:00
newattrs . ia_mode = ( mode & S_IALLUGO ) |
( inode - > i_mode & ~ S_IALLUGO ) ;
newattrs . ia_valid = ATTR_MODE | ATTR_CTIME ;
res = notify_change ( victim , & newattrs ) ;
2006-01-09 15:59:24 -08:00
mutex_unlock ( & inode - > i_mutex ) ;
2005-04-18 21:57:32 -07:00
}
2005-07-29 12:13:35 -07:00
dput ( victim ) ;
2005-04-18 21:57:32 -07:00
}
2006-01-09 15:59:24 -08:00
mutex_unlock ( & dir - > d_inode - > i_mutex ) ;
2005-04-18 21:57:32 -07:00
return res ;
}
EXPORT_SYMBOL_GPL ( sysfs_chmod_file ) ;
2005-04-16 15:20:36 -07:00
/**
* sysfs_remove_file - remove an object attribute .
* @ kobj : object we ' re acting for .
* @ attr : attribute descriptor .
*
* Hash the attribute name and kill the victim .
*/
void sysfs_remove_file ( struct kobject * kobj , const struct attribute * attr )
{
sysfs_hash_and_remove ( kobj - > dentry , attr - > name ) ;
}
EXPORT_SYMBOL_GPL ( sysfs_create_file ) ;
EXPORT_SYMBOL_GPL ( sysfs_remove_file ) ;
EXPORT_SYMBOL_GPL ( sysfs_update_file ) ;