2005-12-15 14:31:24 -08:00
/* -*- mode: c; c-basic-offset: 8; -*-
* vim : noexpandtab sw = 8 ts = 8 sts = 0 :
*
* mmap . c
*
* Code to deal with the mess that is clustered mmap .
*
* Copyright ( C ) 2002 , 2004 Oracle . All rights reserved .
*
* This program is free software ; you can redistribute it and / or
* modify it under the terms of the GNU General Public
* License as published by the Free Software Foundation ; either
* version 2 of the License , or ( at your option ) any later version .
*
* This program is distributed in the hope that it will be useful ,
* but WITHOUT ANY WARRANTY ; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the GNU
* General Public License for more details .
*
* You should have received a copy of the GNU General Public
* License along with this program ; if not , write to the
* Free Software Foundation , Inc . , 59 Temple Place - Suite 330 ,
* Boston , MA 02111 - 1307 , USA .
*/
# include <linux/fs.h>
# include <linux/types.h>
# include <linux/highmem.h>
# include <linux/pagemap.h>
# include <linux/uio.h>
# include <linux/signal.h>
# include <linux/rbtree.h>
# include <cluster/masklog.h>
# include "ocfs2.h"
2007-05-09 15:16:19 -07:00
# include "aops.h"
2005-12-15 14:31:24 -08:00
# include "dlmglue.h"
# include "file.h"
# include "inode.h"
# include "mmap.h"
2009-09-02 17:17:36 -07:00
# include "super.h"
2011-02-22 21:59:46 +08:00
# include "ocfs2_trace.h"
2005-12-15 14:31:24 -08:00
2007-05-09 15:16:19 -07:00
2007-07-19 01:47:03 -07:00
static int ocfs2_fault ( struct vm_area_struct * area , struct vm_fault * vmf )
2005-12-15 14:31:24 -08:00
{
2009-09-02 17:17:36 -07:00
sigset_t oldset ;
int ret ;
2005-12-15 14:31:24 -08:00
2009-09-02 17:17:36 -07:00
ocfs2_block_signals ( & oldset ) ;
2007-07-19 01:47:03 -07:00
ret = filemap_fault ( area , vmf ) ;
2009-09-02 17:17:36 -07:00
ocfs2_unblock_signals ( & oldset ) ;
2005-12-15 14:31:24 -08:00
2011-02-22 21:59:46 +08:00
trace_ocfs2_fault ( OCFS2_I ( area - > vm_file - > f_mapping - > host ) - > ip_blkno ,
area , vmf - > page , vmf - > pgoff ) ;
2007-07-19 01:47:03 -07:00
return ret ;
2005-12-15 14:31:24 -08:00
}
2010-08-12 10:25:28 +08:00
static int __ocfs2_page_mkwrite ( struct file * file , struct buffer_head * di_bh ,
2007-05-09 15:16:19 -07:00
struct page * page )
{
2011-07-24 10:36:54 -07:00
int ret = VM_FAULT_NOPAGE ;
2010-08-12 10:25:28 +08:00
struct inode * inode = file - > f_path . dentry - > d_inode ;
2007-05-09 15:16:19 -07:00
struct address_space * mapping = inode - > i_mapping ;
2007-07-20 00:31:45 -07:00
loff_t pos = page_offset ( page ) ;
2007-05-09 15:16:19 -07:00
unsigned int len = PAGE_CACHE_SIZE ;
pgoff_t last_index ;
struct page * locked_page = NULL ;
void * fsdata ;
loff_t size = i_size_read ( inode ) ;
2005-12-15 14:31:24 -08:00
2010-07-17 21:45:49 +08:00
last_index = ( size - 1 ) > > PAGE_CACHE_SHIFT ;
2007-05-09 15:16:19 -07:00
/*
2011-07-24 10:36:54 -07:00
* There are cases that lead to the page no longer bebongs to the
* mapping .
* 1 ) pagecache truncates locally due to memory pressure .
* 2 ) pagecache truncates when another is taking EX lock against
* inode lock . see ocfs2_data_convert_worker .
*
* The i_size check doesn ' t catch the case where nodes truncated and
* then re - extended the file . We ' ll re - check the page mapping after
* taking the page lock inside of ocfs2_write_begin_nolock ( ) .
*
* Let VM retry with these cases .
2007-05-09 15:16:19 -07:00
*/
2011-07-24 10:36:54 -07:00
if ( ( page - > mapping ! = inode - > i_mapping ) | |
( ! PageUptodate ( page ) ) | |
( page_offset ( page ) > = size ) )
2007-05-09 15:16:19 -07:00
goto out ;
/*
* Call ocfs2_write_begin ( ) and ocfs2_write_end ( ) to take
* advantage of the allocation code there . We pass a write
* length of the whole page ( chopped to i_size ) to make sure
* the whole thing is allocated .
*
* Since we know the page is up to date , we don ' t have to
* worry about ocfs2_write_begin ( ) skipping some buffer reads
* because the " write " would invalidate their data .
*/
if ( page - > index = = last_index )
2010-07-17 21:45:49 +08:00
len = ( ( size - 1 ) & ~ PAGE_CACHE_MASK ) + 1 ;
2007-05-09 15:16:19 -07:00
2010-08-12 10:25:28 +08:00
ret = ocfs2_write_begin_nolock ( file , mapping , pos , len , 0 , & locked_page ,
2007-05-09 15:16:19 -07:00
& fsdata , di_bh , page ) ;
if ( ret ) {
if ( ret ! = - ENOSPC )
mlog_errno ( ret ) ;
2011-07-24 10:36:54 -07:00
if ( ret = = - ENOMEM )
ret = VM_FAULT_OOM ;
else
ret = VM_FAULT_SIGBUS ;
2007-05-09 15:16:19 -07:00
goto out ;
}
2011-07-24 10:36:54 -07:00
if ( ! locked_page ) {
ret = VM_FAULT_NOPAGE ;
2007-05-09 15:16:19 -07:00
goto out ;
}
2011-07-24 10:36:54 -07:00
ret = ocfs2_write_end_nolock ( mapping , pos , len , len , locked_page ,
fsdata ) ;
2007-05-09 15:16:19 -07:00
BUG_ON ( ret ! = len ) ;
2011-07-24 10:36:54 -07:00
ret = VM_FAULT_LOCKED ;
2007-05-09 15:16:19 -07:00
out :
return ret ;
}
2009-03-31 15:23:21 -07:00
static int ocfs2_page_mkwrite ( struct vm_area_struct * vma , struct vm_fault * vmf )
2005-12-15 14:31:24 -08:00
{
2009-03-31 15:23:21 -07:00
struct page * page = vmf - > page ;
2007-05-09 15:16:19 -07:00
struct inode * inode = vma - > vm_file - > f_path . dentry - > d_inode ;
struct buffer_head * di_bh = NULL ;
2009-09-02 17:17:36 -07:00
sigset_t oldset ;
int ret ;
2007-05-09 15:16:19 -07:00
2012-06-12 16:20:40 +02:00
sb_start_pagefault ( inode - > i_sb ) ;
2009-09-02 17:17:36 -07:00
ocfs2_block_signals ( & oldset ) ;
2007-05-09 15:16:19 -07:00
/*
* The cluster locks taken will block a truncate from another
* node . Taking the data lock will also ensure that we don ' t
* attempt page truncation as part of a downconvert .
*/
2007-10-18 15:30:42 -07:00
ret = ocfs2_inode_lock ( inode , & di_bh , 1 ) ;
2007-05-09 15:16:19 -07:00
if ( ret < 0 ) {
mlog_errno ( ret ) ;
goto out ;
}
2006-11-15 15:49:02 +08:00
2007-01-17 13:10:55 -08:00
/*
2007-05-09 15:16:19 -07:00
* The alloc sem should be enough to serialize with
* ocfs2_truncate_file ( ) changing i_size as well as any thread
* modifying the inode btree .
2007-01-17 13:10:55 -08:00
*/
2007-05-09 15:16:19 -07:00
down_write ( & OCFS2_I ( inode ) - > ip_alloc_sem ) ;
2010-08-12 10:25:28 +08:00
ret = __ocfs2_page_mkwrite ( vma - > vm_file , di_bh , page ) ;
2007-05-09 15:16:19 -07:00
up_write ( & OCFS2_I ( inode ) - > ip_alloc_sem ) ;
brelse ( di_bh ) ;
2007-10-18 15:30:42 -07:00
ocfs2_inode_unlock ( inode , 1 ) ;
2007-05-09 15:16:19 -07:00
out :
2009-09-02 17:17:36 -07:00
ocfs2_unblock_signals ( & oldset ) ;
2012-06-12 16:20:40 +02:00
sb_end_pagefault ( inode - > i_sb ) ;
2007-05-09 15:16:19 -07:00
return ret ;
}
2009-09-27 22:29:37 +04:00
static const struct vm_operations_struct ocfs2_file_vm_ops = {
2007-07-19 01:46:59 -07:00
. fault = ocfs2_fault ,
2007-05-09 15:16:19 -07:00
. page_mkwrite = ocfs2_page_mkwrite ,
2012-10-08 16:28:46 -07:00
. remap_pages = generic_file_remap_pages ,
2007-05-09 15:16:19 -07:00
} ;
int ocfs2_mmap ( struct file * file , struct vm_area_struct * vma )
{
int ret = 0 , lock_level = 0 ;
2007-10-18 15:30:42 -07:00
ret = ocfs2_inode_lock_atime ( file - > f_dentry - > d_inode ,
2006-11-15 15:49:02 +08:00
file - > f_vfsmnt , & lock_level ) ;
if ( ret < 0 ) {
mlog_errno ( ret ) ;
goto out ;
}
2007-10-18 15:30:42 -07:00
ocfs2_inode_unlock ( file - > f_dentry - > d_inode , lock_level ) ;
2006-11-15 15:49:02 +08:00
out :
2005-12-15 14:31:24 -08:00
vma - > vm_ops = & ocfs2_file_vm_ops ;
return 0 ;
}