2015-07-17 10:38:12 -04:00
/*
* ( C ) 2001 Clemson University and The University of Chicago
*
* See COPYING in top - level directory .
*/
/*
* Linux VFS inode operations .
*/
# include "protocol.h"
2015-12-04 12:56:14 -05:00
# include "orangefs-kernel.h"
# include "orangefs-bufmap.h"
2015-07-17 10:38:12 -04:00
static int read_one_page ( struct page * page )
{
int ret ;
int max_block ;
ssize_t bytes_read = 0 ;
struct inode * inode = page - > mapping - > host ;
const __u32 blocksize = PAGE_CACHE_SIZE ; /* inode->i_blksize */
const __u32 blockbits = PAGE_CACHE_SHIFT ; /* inode->i_blkbits */
2015-10-08 18:31:05 -04:00
struct iov_iter to ;
struct bio_vec bv = { . bv_page = page , . bv_len = PAGE_SIZE } ;
iov_iter_bvec ( & to , ITER_BVEC | READ , & bv , 1 , PAGE_SIZE ) ;
2015-07-17 10:38:12 -04:00
gossip_debug ( GOSSIP_INODE_DEBUG ,
2015-11-24 15:12:14 -05:00
" orangefs_readpage called with page %p \n " ,
2015-07-17 10:38:12 -04:00
page ) ;
max_block = ( ( inode - > i_size / blocksize ) + 1 ) ;
if ( page - > index < max_block ) {
loff_t blockptr_offset = ( ( ( loff_t ) page - > index ) < < blockbits ) ;
2015-11-24 15:12:14 -05:00
bytes_read = orangefs_inode_read ( inode ,
& to ,
& blockptr_offset ,
inode - > i_size ) ;
2015-07-17 10:38:12 -04:00
}
2015-10-08 18:31:05 -04:00
/* this will only zero remaining unread portions of the page data */
iov_iter_zero ( ~ 0U , & to ) ;
2015-07-17 10:38:12 -04:00
/* takes care of potential aliasing */
flush_dcache_page ( page ) ;
if ( bytes_read < 0 ) {
ret = bytes_read ;
SetPageError ( page ) ;
} else {
SetPageUptodate ( page ) ;
if ( PageError ( page ) )
ClearPageError ( page ) ;
ret = 0 ;
}
/* unlock the page after the ->readpage() routine completes */
unlock_page ( page ) ;
return ret ;
}
2015-11-24 15:12:14 -05:00
/*
 * ->readpage() entry point.  @file is not used; the page is filled by
 * read_one_page() and its result is returned unchanged.
 */
static int orangefs_readpage(struct file *file, struct page *page)
{
	int rc = read_one_page(page);

	return rc;
}
2015-11-24 15:12:14 -05:00
static int orangefs_readpages ( struct file * file ,
2015-07-17 10:38:12 -04:00
struct address_space * mapping ,
struct list_head * pages ,
unsigned nr_pages )
{
int page_idx ;
int ret ;
2015-11-24 15:12:14 -05:00
gossip_debug ( GOSSIP_INODE_DEBUG , " orangefs_readpages called \n " ) ;
2015-07-17 10:38:12 -04:00
for ( page_idx = 0 ; page_idx < nr_pages ; page_idx + + ) {
struct page * page ;
page = list_entry ( pages - > prev , struct page , lru ) ;
list_del ( & page - > lru ) ;
if ( ! add_to_page_cache ( page ,
mapping ,
page - > index ,
GFP_KERNEL ) ) {
ret = read_one_page ( page ) ;
gossip_debug ( GOSSIP_INODE_DEBUG ,
" failure adding page to cache, read_one_page returned: %d \n " ,
ret ) ;
} else {
page_cache_release ( page ) ;
}
}
BUG_ON ( ! list_empty ( pages ) ) ;
return 0 ;
}
2015-11-24 15:12:14 -05:00
static void orangefs_invalidatepage ( struct page * page ,
2015-07-17 10:38:12 -04:00
unsigned int offset ,
unsigned int length )
{
gossip_debug ( GOSSIP_INODE_DEBUG ,
2015-11-24 15:12:14 -05:00
" orangefs_invalidatepage called on page %p "
2015-07-17 10:38:12 -04:00
" (offset is %u) \n " ,
page ,
offset ) ;
ClearPageUptodate ( page ) ;
ClearPageMappedToDisk ( page ) ;
return ;
}
2015-11-24 15:12:14 -05:00
/*
 * ->releasepage() entry point.  Only logs the call; the gfp mask is
 * ignored and 0 is always returned.
 */
static int orangefs_releasepage(struct page *page, gfp_t foo)
{
	gossip_debug(GOSSIP_INODE_DEBUG,
		     " orangefs_releasepage called on page %p \n ",
		     page);

	return 0;
}
/*
* Having a direct_IO entry point in the address_space_operations
* struct causes the kernel to allow us to use O_DIRECT on
* open . Nothing will ever call this thing , but in the future we
* will need to be able to use O_DIRECT on open in order to support
* AIO . Modeled after NFS , they do this too .
*/
/*
2015-12-04 12:56:14 -05:00
* static ssize_t orangefs_direct_IO ( int rw ,
2015-10-05 13:44:24 -04:00
* struct kiocb * iocb ,
* struct iov_iter * iter ,
* loff_t offset )
* {
* gossip_debug ( GOSSIP_INODE_DEBUG ,
2015-11-24 15:12:14 -05:00
* " orangefs_direct_IO: %s \n " ,
2015-10-05 13:44:24 -04:00
* iocb - > ki_filp - > f_path . dentry - > d_name . name ) ;
*
* return - EINVAL ;
* }
*/
2015-07-17 10:38:12 -04:00
2015-11-24 15:12:14 -05:00
struct backing_dev_info orangefs_backing_dev_info = {
. name = " orangefs " ,
2015-07-17 10:38:12 -04:00
. ra_pages = 0 ,
. capabilities = BDI_CAP_NO_ACCT_DIRTY | BDI_CAP_NO_WRITEBACK ,
} ;
2015-11-24 15:12:14 -05:00
/*
 * ORANGEFS2 implementation of address space operations.
 * The direct_IO hook is intentionally left commented out.
 */
const struct address_space_operations orangefs_address_operations = {
	.readpage	= orangefs_readpage,
	.readpages	= orangefs_readpages,
	.invalidatepage	= orangefs_invalidatepage,
	.releasepage	= orangefs_releasepage,
/*	.direct_IO = orangefs_direct_IO */
};
2015-11-24 15:12:14 -05:00
static int orangefs_setattr_size ( struct inode * inode , struct iattr * iattr )
2015-07-17 10:38:12 -04:00
{
2015-11-24 15:12:14 -05:00
struct orangefs_inode_s * orangefs_inode = ORANGEFS_I ( inode ) ;
struct orangefs_kernel_op_s * new_op ;
2015-07-17 10:38:12 -04:00
loff_t orig_size = i_size_read ( inode ) ;
int ret = - EINVAL ;
gossip_debug ( GOSSIP_INODE_DEBUG ,
" %s: %pU: Handle is %pU | fs_id %d | size is %llu \n " ,
__func__ ,
get_khandle_from_ino ( inode ) ,
2015-11-24 15:12:14 -05:00
& orangefs_inode - > refn . khandle ,
orangefs_inode - > refn . fs_id ,
2015-07-17 10:38:12 -04:00
iattr - > ia_size ) ;
truncate_setsize ( inode , iattr - > ia_size ) ;
2015-11-24 15:12:14 -05:00
new_op = op_alloc ( ORANGEFS_VFS_OP_TRUNCATE ) ;
2015-07-17 10:38:12 -04:00
if ( ! new_op )
return - ENOMEM ;
2015-11-24 15:12:14 -05:00
new_op - > upcall . req . truncate . refn = orangefs_inode - > refn ;
2015-07-17 10:38:12 -04:00
new_op - > upcall . req . truncate . size = ( __s64 ) iattr - > ia_size ;
ret = service_operation ( new_op , __func__ ,
get_interruptible_flag ( inode ) ) ;
/*
* the truncate has no downcall members to retrieve , but
* the status value tells us if it went through ok or not
*/
gossip_debug ( GOSSIP_INODE_DEBUG ,
2015-11-24 15:12:14 -05:00
" orangefs: orangefs_truncate got return value of %d \n " ,
2015-07-17 10:38:12 -04:00
ret ) ;
op_release ( new_op ) ;
if ( ret ! = 0 )
return ret ;
/*
* Only change the c / mtime if we are changing the size or we are
* explicitly asked to change it . This handles the semantic difference
* between truncate ( ) and ftruncate ( ) as implemented in the VFS .
*
* The regular truncate ( ) case without ATTR_CTIME and ATTR_MTIME is a
* special case where we need to update the times despite not having
* these flags set . For all other operations the VFS set these flags
* explicitly if it wants a timestamp update .
*/
if ( orig_size ! = i_size_read ( inode ) & &
! ( iattr - > ia_valid & ( ATTR_CTIME | ATTR_MTIME ) ) ) {
iattr - > ia_ctime = iattr - > ia_mtime =
current_fs_time ( inode - > i_sb ) ;
iattr - > ia_valid | = ATTR_CTIME | ATTR_MTIME ;
}
return ret ;
}
/*
* Change attributes of an object referenced by dentry .
*/
2015-11-24 15:12:14 -05:00
int orangefs_setattr ( struct dentry * dentry , struct iattr * iattr )
2015-07-17 10:38:12 -04:00
{
int ret = - EINVAL ;
struct inode * inode = dentry - > d_inode ;
gossip_debug ( GOSSIP_INODE_DEBUG ,
2015-11-24 15:12:14 -05:00
" orangefs_setattr: called on %s \n " ,
2015-07-17 10:38:12 -04:00
dentry - > d_name . name ) ;
ret = inode_change_ok ( inode , iattr ) ;
if ( ret )
goto out ;
if ( ( iattr - > ia_valid & ATTR_SIZE ) & &
iattr - > ia_size ! = i_size_read ( inode ) ) {
2015-11-24 15:12:14 -05:00
ret = orangefs_setattr_size ( inode , iattr ) ;
2015-07-17 10:38:12 -04:00
if ( ret )
goto out ;
}
setattr_copy ( inode , iattr ) ;
mark_inode_dirty ( inode ) ;
2015-11-24 15:12:14 -05:00
ret = orangefs_inode_setattr ( inode , iattr ) ;
2015-07-17 10:38:12 -04:00
gossip_debug ( GOSSIP_INODE_DEBUG ,
2015-11-24 15:12:14 -05:00
" orangefs_setattr: inode_setattr returned %d \n " ,
2015-07-17 10:38:12 -04:00
ret ) ;
if ( ! ret & & ( iattr - > ia_valid & ATTR_MODE ) )
/* change mod on a file that has ACLs */
ret = posix_acl_chmod ( inode , inode - > i_mode ) ;
out :
2015-11-24 15:12:14 -05:00
gossip_debug ( GOSSIP_INODE_DEBUG , " orangefs_setattr: returning %d \n " , ret ) ;
2015-07-17 10:38:12 -04:00
return ret ;
}
/*
* Obtain attributes of an object given a dentry
*/
2015-11-24 15:12:14 -05:00
int orangefs_getattr ( struct vfsmount * mnt ,
2015-07-17 10:38:12 -04:00
struct dentry * dentry ,
struct kstat * kstat )
{
int ret = - ENOENT ;
struct inode * inode = dentry - > d_inode ;
2015-11-24 15:12:14 -05:00
struct orangefs_inode_s * orangefs_inode = NULL ;
2015-07-17 10:38:12 -04:00
gossip_debug ( GOSSIP_INODE_DEBUG ,
2015-11-24 15:12:14 -05:00
" orangefs_getattr: called on %s \n " ,
2015-07-17 10:38:12 -04:00
dentry - > d_name . name ) ;
/*
* Similar to the above comment , a getattr also expects that all
* fields / attributes of the inode would be refreshed . So again , we
* dont have too much of a choice but refresh all the attributes .
*/
2015-11-24 15:12:14 -05:00
ret = orangefs_inode_getattr ( inode , ORANGEFS_ATTR_SYS_ALL_NOHINT ) ;
2015-07-17 10:38:12 -04:00
if ( ret = = 0 ) {
generic_fillattr ( inode , kstat ) ;
/* override block size reported to stat */
2015-11-24 15:12:14 -05:00
orangefs_inode = ORANGEFS_I ( inode ) ;
kstat - > blksize = orangefs_inode - > blksize ;
2015-07-17 10:38:12 -04:00
} else {
/* assume an I/O error and flag inode as bad */
gossip_debug ( GOSSIP_INODE_DEBUG ,
" %s:%s:%d calling make bad inode \n " ,
__FILE__ ,
__func__ ,
__LINE__ ) ;
2015-11-24 15:12:14 -05:00
orangefs_make_bad_inode ( inode ) ;
2015-07-17 10:38:12 -04:00
}
return ret ;
}
2015-11-24 15:12:14 -05:00
/* ORANGEDS2 implementation of VFS inode operations for files */
struct inode_operations orangefs_file_inode_operations = {
. get_acl = orangefs_get_acl ,
. set_acl = orangefs_set_acl ,
. setattr = orangefs_setattr ,
. getattr = orangefs_getattr ,
2015-07-17 10:38:12 -04:00
. setxattr = generic_setxattr ,
. getxattr = generic_getxattr ,
2015-11-24 15:12:14 -05:00
. listxattr = orangefs_listxattr ,
2015-07-17 10:38:12 -04:00
. removexattr = generic_removexattr ,
} ;
2015-11-24 15:12:14 -05:00
static int orangefs_init_iops ( struct inode * inode )
2015-07-17 10:38:12 -04:00
{
2015-11-24 15:12:14 -05:00
inode - > i_mapping - > a_ops = & orangefs_address_operations ;
2015-07-17 10:38:12 -04:00
switch ( inode - > i_mode & S_IFMT ) {
case S_IFREG :
2015-11-24 15:12:14 -05:00
inode - > i_op = & orangefs_file_inode_operations ;
inode - > i_fop = & orangefs_file_operations ;
2015-07-17 10:38:12 -04:00
inode - > i_blkbits = PAGE_CACHE_SHIFT ;
break ;
case S_IFLNK :
2015-11-24 15:12:14 -05:00
inode - > i_op = & orangefs_symlink_inode_operations ;
2015-07-17 10:38:12 -04:00
break ;
case S_IFDIR :
2015-11-24 15:12:14 -05:00
inode - > i_op = & orangefs_dir_inode_operations ;
inode - > i_fop = & orangefs_dir_operations ;
2015-07-17 10:38:12 -04:00
break ;
default :
gossip_debug ( GOSSIP_INODE_DEBUG ,
" %s: unsupported mode \n " ,
__func__ ) ;
return - EINVAL ;
}
return 0 ;
}
/*
2015-11-24 15:12:14 -05:00
* Given a ORANGEFS object identifier ( fsid , handle ) , convert it into a ino_t type
2015-07-17 10:38:12 -04:00
* that will be used as a hash - index from where the handle will
* be searched for in the VFS hash table of inodes .
*/
2015-11-24 15:12:14 -05:00
static inline ino_t orangefs_handle_hash ( struct orangefs_object_kref * ref )
2015-07-17 10:38:12 -04:00
{
if ( ! ref )
return 0 ;
2015-11-24 15:12:14 -05:00
return orangefs_khandle_to_ino ( & ( ref - > khandle ) ) ;
2015-07-17 10:38:12 -04:00
}
/*
* Called to set up an inode from iget5_locked .
*/
2015-11-24 15:12:14 -05:00
static int orangefs_set_inode ( struct inode * inode , void * data )
2015-07-17 10:38:12 -04:00
{
2015-11-24 15:12:14 -05:00
struct orangefs_object_kref * ref = ( struct orangefs_object_kref * ) data ;
struct orangefs_inode_s * orangefs_inode = NULL ;
2015-07-17 10:38:12 -04:00
/* Make sure that we have sane parameters */
if ( ! data | | ! inode )
return 0 ;
2015-11-24 15:12:14 -05:00
orangefs_inode = ORANGEFS_I ( inode ) ;
if ( ! orangefs_inode )
2015-07-17 10:38:12 -04:00
return 0 ;
2015-11-24 15:12:14 -05:00
orangefs_inode - > refn . fs_id = ref - > fs_id ;
orangefs_inode - > refn . khandle = ref - > khandle ;
2015-07-17 10:38:12 -04:00
return 0 ;
}
/*
* Called to determine if handles match .
*/
2015-11-24 15:12:14 -05:00
static int orangefs_test_inode ( struct inode * inode , void * data )
2015-07-17 10:38:12 -04:00
{
2015-11-24 15:12:14 -05:00
struct orangefs_object_kref * ref = ( struct orangefs_object_kref * ) data ;
struct orangefs_inode_s * orangefs_inode = NULL ;
2015-07-17 10:38:12 -04:00
2015-11-24 15:12:14 -05:00
orangefs_inode = ORANGEFS_I ( inode ) ;
return ( ! ORANGEFS_khandle_cmp ( & ( orangefs_inode - > refn . khandle ) , & ( ref - > khandle ) )
& & orangefs_inode - > refn . fs_id = = ref - > fs_id ) ;
2015-07-17 10:38:12 -04:00
}
/*
2015-11-24 15:12:14 -05:00
* Front - end to lookup the inode - cache maintained by the VFS using the ORANGEFS
2015-07-17 10:38:12 -04:00
* file handle .
*
* @ sb : the file system super block instance .
2015-11-24 15:12:14 -05:00
* @ ref : The ORANGEFS object for which we are trying to locate an inode structure .
2015-07-17 10:38:12 -04:00
*/
2015-11-24 15:12:14 -05:00
struct inode * orangefs_iget ( struct super_block * sb , struct orangefs_object_kref * ref )
2015-07-17 10:38:12 -04:00
{
struct inode * inode = NULL ;
unsigned long hash ;
int error ;
2015-11-24 15:12:14 -05:00
hash = orangefs_handle_hash ( ref ) ;
inode = iget5_locked ( sb , hash , orangefs_test_inode , orangefs_set_inode , ref ) ;
2015-07-17 10:38:12 -04:00
if ( ! inode | | ! ( inode - > i_state & I_NEW ) )
return inode ;
2015-11-24 15:12:14 -05:00
error = orangefs_inode_getattr ( inode , ORANGEFS_ATTR_SYS_ALL_NOHINT ) ;
2015-07-17 10:38:12 -04:00
if ( error ) {
iget_failed ( inode ) ;
return ERR_PTR ( error ) ;
}
inode - > i_ino = hash ; /* needed for stat etc */
2015-11-24 15:12:14 -05:00
orangefs_init_iops ( inode ) ;
2015-07-17 10:38:12 -04:00
unlock_new_inode ( inode ) ;
gossip_debug ( GOSSIP_INODE_DEBUG ,
" iget handle %pU, fsid %d hash %ld i_ino %lu \n " ,
& ref - > khandle ,
ref - > fs_id ,
hash ,
inode - > i_ino ) ;
return inode ;
}
/*
* Allocate an inode for a newly created file and insert it into the inode hash .
*/
2015-11-24 15:12:14 -05:00
struct inode * orangefs_new_inode ( struct super_block * sb , struct inode * dir ,
int mode , dev_t dev , struct orangefs_object_kref * ref )
2015-07-17 10:38:12 -04:00
{
2015-11-24 15:12:14 -05:00
unsigned long hash = orangefs_handle_hash ( ref ) ;
2015-07-17 10:38:12 -04:00
struct inode * inode ;
int error ;
gossip_debug ( GOSSIP_INODE_DEBUG ,
2015-11-24 15:12:14 -05:00
" orangefs_get_custom_inode_common: called \n "
2015-07-17 10:38:12 -04:00
" (sb is %p | MAJOR(dev)=%u | MINOR(dev)=%u mode=%o) \n " ,
sb ,
MAJOR ( dev ) ,
MINOR ( dev ) ,
mode ) ;
inode = new_inode ( sb ) ;
if ( ! inode )
return NULL ;
2015-11-24 15:12:14 -05:00
orangefs_set_inode ( inode , ref ) ;
2015-07-17 10:38:12 -04:00
inode - > i_ino = hash ; /* needed for stat etc */
2015-11-24 15:12:14 -05:00
error = orangefs_inode_getattr ( inode , ORANGEFS_ATTR_SYS_ALL_NOHINT ) ;
2015-07-17 10:38:12 -04:00
if ( error )
goto out_iput ;
2015-11-24 15:12:14 -05:00
orangefs_init_iops ( inode ) ;
2015-07-17 10:38:12 -04:00
inode - > i_mode = mode ;
inode - > i_uid = current_fsuid ( ) ;
inode - > i_gid = current_fsgid ( ) ;
inode - > i_atime = inode - > i_mtime = inode - > i_ctime = CURRENT_TIME ;
inode - > i_size = PAGE_CACHE_SIZE ;
inode - > i_rdev = dev ;
2015-11-24 15:12:14 -05:00
error = insert_inode_locked4 ( inode , hash , orangefs_test_inode , ref ) ;
2015-07-17 10:38:12 -04:00
if ( error < 0 )
goto out_iput ;
gossip_debug ( GOSSIP_INODE_DEBUG ,
" Initializing ACL's for inode %pU \n " ,
get_khandle_from_ino ( inode ) ) ;
2015-11-24 15:12:14 -05:00
orangefs_init_acl ( inode , dir ) ;
2015-07-17 10:38:12 -04:00
return inode ;
out_iput :
iput ( inode ) ;
return ERR_PTR ( error ) ;
}