2006-10-11 01:20:57 -07:00
/*
2008-04-29 18:13:32 -04:00
* ext4_jbd2 . h
2006-10-11 01:20:57 -07:00
*
* Written by Stephen C. Tweedie <sct@redhat.com>, 1999
*
* Copyright 1998--1999 Red Hat corp --- All Rights Reserved
*
* This file is part of the Linux kernel and is made available under
* the terms of the GNU General Public License, version 2, or at your
* option, any later version, incorporated herein by reference.
*
* Ext4 - specific journaling extensions .
*/
2008-04-29 18:13:32 -04:00
# ifndef _EXT4_JBD2_H
# define _EXT4_JBD2_H
2006-10-11 01:20:57 -07:00
# include <linux/fs.h>
2006-10-11 01:20:59 -07:00
# include <linux/jbd2.h>
2008-04-29 18:13:32 -04:00
# include "ext4.h"
2006-10-11 01:20:57 -07:00
/* Journal pointer (s_journal) of the superblock that owns @inode. */
#define EXT4_JOURNAL(inode)	(EXT4_SB((inode)->i_sb)->s_journal)
/*
 * Define the number of blocks we need to account to a transaction to
 * modify one block of data.
 *
 * We may have to touch one inode, one bitmap buffer, up to three
 * indirection blocks, the group and superblock summaries, and the data
 * block to complete the transaction.
 *
 * For extents-enabled fs we may have to allocate and modify up to
 * 5 levels of tree + root which are stored in the inode.
 *
 * Evaluates to 27U when the superblock has the EXTENTS incompat feature
 * and to 8U otherwise.
 */
#define EXT4_SINGLEDATA_TRANS_BLOCKS(sb)				\
	(EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_EXTENTS)	\
	 ? 27U : 8U)
2006-10-11 01:20:57 -07:00
/*
 * Extended attribute operations touch at most two data buffers,
 * two bitmap buffers, and two group summaries, in addition to the inode
 * and the superblock, which are already accounted for.
 */
#define EXT4_XATTR_TRANS_BLOCKS		6U
/*
 * Define the minimum size for a transaction which modifies data.  This
 * needs to take into account the fact that we may end up modifying two
 * quota files too (one for the group, one for the user quota).  The
 * superblock only gets updated once, of course, so don't bother
 * counting that again for the quota updates.
 *
 * Computed as the single-data-block credits, plus the xattr credits
 * minus 2, plus the credits for updating every quota type.
 */
#define EXT4_DATA_TRANS_BLOCKS(sb)	(EXT4_SINGLEDATA_TRANS_BLOCKS(sb) + \
					 EXT4_XATTR_TRANS_BLOCKS - 2 + \
					 EXT4_MAXQUOTAS_TRANS_BLOCKS(sb))
2006-10-11 01:20:57 -07:00
ext4: journal credits calculation cleanup and fix for non-extent writepage
When considering how many journal credits are needed for modifying a
chunk of data, we need to account for the super block, inode block,
quota blocks and xattr block, indirect/index blocks, and also the group
bitmap and group descriptor blocks for new allocations (including data and
indirect/index blocks). Many places in ext4 do the calculation
on their own and often miss one or two metadata blocks; they also often
assume single-block allocation and do not consider the multiple-chunk
allocation case.
This patch tries to clean up the current journal credit code and provides
some common helper functions to calculate the journal credits, to be used
for writepage, writepages, DIO, fallocate, migration, defrag, and for
both nonextent and extent files.
This patch modifies the writepage/write_begin credit calculation for
nonextent files to use the new helper function. It also fixes the
problem that writepage on nonextent files did not consider the case
blocksize < pagesize, and thus could possibly need multiple block
allocations in a single transaction.
Signed-off-by: Mingming Cao <cmm@us.ibm.com>
Reviewed-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com>
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
2008-08-19 22:16:07 -04:00
/*
 * Define the number of metadata blocks we need to account to modify data.
 *
 * This is the sum of the xattr credits and the credits for updating
 * every quota type.
 * NOTE(review): the previous comment also listed the super block and the
 * inode block, but neither appears as a term in this expression - confirm
 * whether callers are expected to add them separately.
 */
#define EXT4_META_TRANS_BLOCKS(sb)	(EXT4_XATTR_TRANS_BLOCKS + \
					 EXT4_MAXQUOTAS_TRANS_BLOCKS(sb))
ext4: journal credits calculation cleanup and fix for non-extent writepage
When considering how many journal credits are needed for modifying a
chunk of data, we need to account for the super block, inode block,
quota blocks and xattr block, indirect/index blocks, and also the group
bitmap and group descriptor blocks for new allocations (including data and
indirect/index blocks). Many places in ext4 do the calculation
on their own and often miss one or two metadata blocks; they also often
assume single-block allocation and do not consider the multiple-chunk
allocation case.
This patch tries to clean up the current journal credit code and provides
some common helper functions to calculate the journal credits, to be used
for writepage, writepages, DIO, fallocate, migration, defrag, and for
both nonextent and extent files.
This patch modifies the writepage/write_begin credit calculation for
nonextent files to use the new helper function. It also fixes the
problem that writepage on nonextent files did not consider the case
blocksize < pagesize, and thus could possibly need multiple block
allocations in a single transaction.
Signed-off-by: Mingming Cao <cmm@us.ibm.com>
Reviewed-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com>
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
2008-08-19 22:16:07 -04:00
2006-10-11 01:20:57 -07:00
/*
 * Delete operations potentially hit one directory's namespace plus an
 * entire inode, plus arbitrary amounts of bitmap/indirection data.  Be
 * generous.  We can grow the delete transaction later if necessary.
 *
 * Twice the data-transaction credits plus a fixed 64 extra blocks.
 */
#define EXT4_DELETE_TRANS_BLOCKS(sb)	(2 * EXT4_DATA_TRANS_BLOCKS(sb) + 64)
/*
 * Define an arbitrary limit for the amount of data we will anticipate
 * writing to any given transaction.  For unbounded transactions such as
 * write(2) and truncate(2) we can write more than this, but we always
 * start off at the maximum transaction size and grow the transaction
 * optimistically as we go.
 */
#define EXT4_MAX_TRANS_DATA		64U
/*
 * We break up a large truncate or write transaction once the handle's
 * buffer credits get this low: at that point we need either to extend
 * the transaction or to start a new one.  Reserve enough space here for
 * inode, bitmap, superblock, group and indirection updates for at least
 * one block, plus two quota updates.  Quota allocations are not
 * needed.
 */
#define EXT4_RESERVE_TRANS_BLOCKS	12U
/*
 * Extra credits constant; a plain (signed) int, unlike the U-suffixed
 * limits around it.
 * NOTE(review): presumably the extra credits for directory index updates -
 * confirm against the callers.
 */
#define EXT4_INDEX_EXTRA_TRANS_BLOCKS	8
#ifdef CONFIG_QUOTA
/*
 * Amount of blocks needed for quota update - we know that the structure was
 * allocated so we need to update only data block.
 * Evaluates to 1 when the QUOTA mount option is set on @sb, else 0.
 */
#define EXT4_QUOTA_TRANS_BLOCKS(sb) (test_opt(sb, QUOTA) ? 1 : 0)
/*
 * Amount of blocks needed for quota insert/delete - we do some block writes
 * but inode, sb and group updates are done only once.  Hence the "- 3"
 * applied to each per-block cost and the single "+ 3" added back.
 * Both evaluate to 0 when the QUOTA mount option is not set on @sb.
 */
#define EXT4_QUOTA_INIT_BLOCKS(sb) (test_opt(sb, QUOTA) ? (DQUOT_INIT_ALLOC*\
		(EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)+3+DQUOT_INIT_REWRITE) : 0)

#define EXT4_QUOTA_DEL_BLOCKS(sb) (test_opt(sb, QUOTA) ? (DQUOT_DEL_ALLOC*\
		(EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)+3+DQUOT_DEL_REWRITE) : 0)
#else
/* Without CONFIG_QUOTA no journal credits are needed for quota at all. */
#define EXT4_QUOTA_TRANS_BLOCKS(sb) 0
#define EXT4_QUOTA_INIT_BLOCKS(sb) 0
#define EXT4_QUOTA_DEL_BLOCKS(sb) 0
#endif
2009-12-08 22:42:15 -05:00
/*
 * Per-quota-type credit counts scaled by MAXQUOTAS, i.e. the cost of
 * updating, initialising or deleting every quota type at once.
 */
#define EXT4_MAXQUOTAS_TRANS_BLOCKS(sb)	(MAXQUOTAS*EXT4_QUOTA_TRANS_BLOCKS(sb))
#define EXT4_MAXQUOTAS_INIT_BLOCKS(sb)	(MAXQUOTAS*EXT4_QUOTA_INIT_BLOCKS(sb))
#define EXT4_MAXQUOTAS_DEL_BLOCKS(sb)	(MAXQUOTAS*EXT4_QUOTA_DEL_BLOCKS(sb))
2006-10-11 01:20:57 -07:00
/* Inode-dirtying helpers; they are only declared here. */
int ext4_mark_iloc_dirty(handle_t *handle, struct inode *inode,
			 struct ext4_iloc *iloc);

/*
 * On success, we end up with an outstanding reference count against
 * iloc->bh.  This _must_ be cleaned up later.
 */
int ext4_reserve_inode_write(handle_t *handle, struct inode *inode,
			     struct ext4_iloc *iloc);

int ext4_mark_inode_dirty(handle_t *handle, struct inode *inode);
/*
2009-11-24 11:05:59 -05:00
* Wrapper functions with which ext4 calls into JBD .
2006-10-11 01:20:57 -07:00
*/
2010-06-29 14:53:24 -04:00
void ext4_journal_abort_handle ( const char * caller , unsigned int line ,
const char * err_fn ,
2006-12-06 20:37:15 -08:00
struct buffer_head * bh , handle_t * handle , int err ) ;
2006-10-11 01:20:57 -07:00
2010-06-29 14:53:24 -04:00
int __ext4_journal_get_write_access ( const char * where , unsigned int line ,
handle_t * handle , struct buffer_head * bh ) ;
2006-10-11 01:20:57 -07:00
2010-06-29 14:53:24 -04:00
int __ext4_forget ( const char * where , unsigned int line , handle_t * handle ,
int is_metadata , struct inode * inode ,
struct buffer_head * bh , ext4_fsblk_t blocknr ) ;
2009-11-22 20:52:12 -05:00
2010-06-29 14:53:24 -04:00
int __ext4_journal_get_create_access ( const char * where , unsigned int line ,
2006-12-06 20:37:15 -08:00
handle_t * handle , struct buffer_head * bh ) ;
2006-10-11 01:20:57 -07:00
2010-06-29 14:53:24 -04:00
int __ext4_handle_dirty_metadata ( const char * where , unsigned int line ,
handle_t * handle , struct inode * inode ,
struct buffer_head * bh ) ;
2006-10-11 01:20:57 -07:00
2010-06-29 14:53:24 -04:00
int __ext4_handle_dirty_super ( const char * where , unsigned int line ,
handle_t * handle , struct super_block * sb ) ;
2010-06-11 23:14:04 -04:00
2006-10-11 01:20:57 -07:00
/*
 * Convenience wrappers: each one forwards to its __ext4_* counterpart,
 * passing __func__ and __LINE__ of the call site as the first two
 * arguments and the macro arguments (parenthesised) after them.
 */
#define ext4_journal_get_write_access(handle, bh) \
	__ext4_journal_get_write_access(__func__, __LINE__, (handle), (bh))
#define ext4_forget(handle, is_metadata, inode, bh, block_nr) \
	__ext4_forget(__func__, __LINE__, (handle), (is_metadata), (inode), \
		      (bh), (block_nr))
#define ext4_journal_get_create_access(handle, bh) \
	__ext4_journal_get_create_access(__func__, __LINE__, (handle), (bh))
#define ext4_handle_dirty_metadata(handle, inode, bh) \
	__ext4_handle_dirty_metadata(__func__, __LINE__, (handle), (inode), \
				     (bh))
#define ext4_handle_dirty_super(handle, sb) \
	__ext4_handle_dirty_super(__func__, __LINE__, (handle), (sb))
2006-10-11 01:20:57 -07:00
/* Start a handle on @sb's journal, asking for @nblocks credits. */
handle_t *ext4_journal_start_sb(struct super_block *sb, int nblocks);
/* Stop @handle; @where and @line identify the call site. */
int __ext4_journal_stop(const char *where, unsigned int line, handle_t *handle);
2006-10-11 01:20:57 -07:00
2009-09-29 11:01:03 -04:00
/*
 * Handle pointer values below this bound are treated as "no journal"
 * handles by ext4_handle_valid().
 */
#define EXT4_NOJOURNAL_MAX_REF_COUNT	((unsigned long) 4096)
2009-01-07 00:06:22 -05:00
2009-09-29 11:01:03 -04:00
/* Note: Do not use this for NULL handles. This is only to determine if
* a properly allocated handle is using a journal or not . */
2009-01-07 00:06:22 -05:00
static inline int ext4_handle_valid ( handle_t * handle )
{
2009-09-29 11:01:03 -04:00
if ( ( unsigned long ) handle < EXT4_NOJOURNAL_MAX_REF_COUNT )
2009-01-07 00:06:22 -05:00
return 0 ;
return 1 ;
}
/* Set h_sync on @handle; does nothing for a handle that is not valid. */
static inline void ext4_handle_sync(handle_t *handle)
{
	if (!ext4_handle_valid(handle))
		return;
	handle->h_sync = 1;
}
/*
 * Pass @bh to jbd2_journal_release_buffer() for a valid @handle; does
 * nothing otherwise.
 */
static inline void ext4_handle_release_buffer(handle_t *handle,
					      struct buffer_head *bh)
{
	if (!ext4_handle_valid(handle))
		return;
	jbd2_journal_release_buffer(handle, bh);
}
/*
 * Return is_handle_aborted() for a valid @handle; a handle that is not
 * valid is never reported as aborted (returns 0).
 */
static inline int ext4_handle_is_aborted(handle_t *handle)
{
	return ext4_handle_valid(handle) ? is_handle_aborted(handle) : 0;
}
/*
 * Return 1 if @handle has at least @needed buffer credits left, 0 if not.
 * A handle that is not valid always reports 1.
 */
static inline int ext4_handle_has_enough_credits(handle_t *handle, int needed)
{
	if (!ext4_handle_valid(handle))
		return 1;
	return handle->h_buffer_credits >= needed;
}
2006-10-11 01:20:57 -07:00
static inline handle_t * ext4_journal_start ( struct inode * inode , int nblocks )
{
return ext4_journal_start_sb ( inode - > i_sb , nblocks ) ;
}
/* Stop @handle, recording the calling function and line for diagnostics. */
#define ext4_journal_stop(handle) \
	__ext4_journal_stop(__func__, __LINE__, (handle))
2006-10-11 01:20:57 -07:00
/* Return whatever journal_current_handle() reports. */
static inline handle_t *ext4_journal_current_handle(void)
{
	handle_t *current_handle = journal_current_handle();

	return current_handle;
}
/*
 * Forward to jbd2_journal_extend() for a valid @handle and return its
 * result; return 0 without doing anything when the handle is not valid.
 */
static inline int ext4_journal_extend(handle_t *handle, int nblocks)
{
	if (!ext4_handle_valid(handle))
		return 0;
	return jbd2_journal_extend(handle, nblocks);
}
/*
 * Forward to jbd2_journal_restart() for a valid @handle and return its
 * result; return 0 without doing anything when the handle is not valid.
 */
static inline int ext4_journal_restart(handle_t *handle, int nblocks)
{
	if (!ext4_handle_valid(handle))
		return 0;
	return jbd2_journal_restart(handle, nblocks);
}
/*
 * Return jbd2_journal_blocks_per_page() for @inode, or 0 when the
 * filesystem has no journal.
 */
static inline int ext4_journal_blocks_per_page(struct inode *inode)
{
	if (EXT4_JOURNAL(inode) == NULL)
		return 0;
	return jbd2_journal_blocks_per_page(inode);
}
/*
 * Return jbd2_journal_force_commit() for @journal, or 0 when @journal is
 * NULL.
 */
static inline int ext4_journal_force_commit(journal_t *journal)
{
	if (!journal)
		return 0;
	return jbd2_journal_force_commit(journal);
}
2008-07-11 19:27:31 -04:00
/*
 * Pass the inode's jinode to jbd2_journal_file_inode() for a valid
 * @handle and return its result; return 0 when the handle is not valid.
 */
static inline int ext4_jbd2_file_inode(handle_t *handle, struct inode *inode)
{
	if (!ext4_handle_valid(handle))
		return 0;
	return jbd2_journal_file_inode(handle, EXT4_I(inode)->jinode);
}
2009-12-08 23:51:10 -05:00
/*
 * Record the tid of @handle's transaction in the inode's i_sync_tid and,
 * when @datasync is non-zero, in i_datasync_tid as well.  Nothing is
 * recorded for a handle that is not valid.
 */
static inline void ext4_update_inode_fsync_trans(handle_t *handle,
						 struct inode *inode,
						 int datasync)
{
	struct ext4_inode_info *ei = EXT4_I(inode);

	if (!ext4_handle_valid(handle))
		return;

	ei->i_sync_tid = handle->h_transaction->t_tid;
	if (datasync)
		ei->i_datasync_tid = handle->h_transaction->t_tid;
}
2006-10-11 01:20:57 -07:00
/* Declared here; per the original marker, defined in super.c. */
int ext4_force_commit(struct super_block *sb);
static inline int ext4_should_journal_data ( struct inode * inode )
{
2009-01-07 00:06:22 -05:00
if ( EXT4_JOURNAL ( inode ) = = NULL )
return 0 ;
2006-10-11 01:20:57 -07:00
if ( ! S_ISREG ( inode - > i_mode ) )
return 1 ;
if ( test_opt ( inode - > i_sb , DATA_FLAGS ) = = EXT4_MOUNT_JOURNAL_DATA )
return 1 ;
2010-05-16 22:00:00 -04:00
if ( ext4_test_inode_flag ( inode , EXT4_INODE_JOURNAL_DATA ) )
2006-10-11 01:20:57 -07:00
return 1 ;
return 0 ;
}
static inline int ext4_should_order_data ( struct inode * inode )
{
2009-01-07 00:06:22 -05:00
if ( EXT4_JOURNAL ( inode ) = = NULL )
return 0 ;
2006-10-11 01:20:57 -07:00
if ( ! S_ISREG ( inode - > i_mode ) )
return 0 ;
2010-05-16 22:00:00 -04:00
if ( ext4_test_inode_flag ( inode , EXT4_INODE_JOURNAL_DATA ) )
2006-10-11 01:20:57 -07:00
return 0 ;
if ( test_opt ( inode - > i_sb , DATA_FLAGS ) = = EXT4_MOUNT_ORDERED_DATA )
return 1 ;
return 0 ;
}
static inline int ext4_should_writeback_data ( struct inode * inode )
{
2009-07-08 17:11:24 -04:00
if ( EXT4_JOURNAL ( inode ) = = NULL )
return 1 ;
ext4: Fix ext4_should_writeback_data() for no-journal mode
ext4_should_writeback_data() had an incorrect sequence of
tests to determine if it should return 0 or 1: in
particular, even in no-journal mode, 0 was being returned
for a non-regular-file inode.
This meant that, in non-journal mode, we would use
ext4_journalled_aops for directories, symlinks, and other
non-regular files. However, calling journalled aop
callbacks when there is no valid handle, can cause problems.
This would cause a kernel crash with Jan Kara's commit
2d859db3e4 ("ext4: fix data corruption in inodes with
journalled data"), because we now dereference 'handle' in
ext4_journalled_write_end().
I also added BUG_ONs to check for a valid handle in the
obviously journal-only aops callbacks.
I tested this running xfstests with a scratch device in
these modes:
- no-journal
- data=ordered
- data=writeback
- data=journal
All work fine; the data=journal run has many failures and a
crash in xfstests 074, but this is no different from a
vanilla kernel.
Signed-off-by: Curt Wohlgemuth <curtw@google.com>
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
Cc: stable@kernel.org
2011-08-13 11:25:18 -04:00
if ( ! S_ISREG ( inode - > i_mode ) )
return 0 ;
2010-05-16 22:00:00 -04:00
if ( ext4_test_inode_flag ( inode , EXT4_INODE_JOURNAL_DATA ) )
2006-10-11 01:20:57 -07:00
return 0 ;
if ( test_opt ( inode - > i_sb , DATA_FLAGS ) = = EXT4_MOUNT_WRITEBACK_DATA )
return 1 ;
return 0 ;
}
2010-03-04 16:14:02 -05:00
/*
* This function controls whether or not we should try to go down the
* dioread_nolock code paths , which makes it safe to avoid taking
* i_mutex for direct I / O reads . This only works for extent - based
2010-06-14 14:42:49 -04:00
* files , and it doesn ' t work if data journaling is enabled , since the
* dioread_nolock code uses b_private to pass information back to the
* I / O completion handler , and this conflicts with the jbd ' s use of
* b_private .
2010-03-04 16:14:02 -05:00
*/
static inline int ext4_should_dioread_nolock ( struct inode * inode )
{
if ( ! test_opt ( inode - > i_sb , DIOREAD_NOLOCK ) )
return 0 ;
if ( ! S_ISREG ( inode - > i_mode ) )
return 0 ;
2010-05-16 22:00:00 -04:00
if ( ! ( ext4_test_inode_flag ( inode , EXT4_INODE_EXTENTS ) ) )
2010-03-04 16:14:02 -05:00
return 0 ;
if ( ext4_should_journal_data ( inode ) )
return 0 ;
return 1 ;
}
2008-04-29 18:13:32 -04:00
# endif /* _EXT4_JBD2_H */