/*
 *   Copyright (C) International Business Machines Corp., 2000-2004
 *
 *   This program is free software;  you can redistribute it and/or modify
 *   it under the terms of the GNU General Public License as published by
 *   the Free Software Foundation; either version 2 of the License, or
 *   (at your option) any later version.
 *
 *   This program is distributed in the hope that it will be useful,
 *   but WITHOUT ANY WARRANTY;  without even the implied warranty of
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See
 *   the GNU General Public License for more details.
 *
 *   You should have received a copy of the GNU General Public License
 *   along with this program;  if not, write to the Free Software
 *   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */
# include <linux/fs.h>
# include <linux/buffer_head.h>
# include <linux/quotaops.h>
# include "jfs_incore.h"
# include "jfs_filsys.h"
# include "jfs_metapage.h"
# include "jfs_dinode.h"
# include "jfs_imap.h"
# include "jfs_dmap.h"
# include "jfs_superblock.h"
# include "jfs_txnmgr.h"
# include "jfs_debug.h"
/* number of bits in one PSIZE-byte page (8 bits per byte) */
#define BITSPERPAGE	(PSIZE << 3)
/* log2 of one megabyte, and one / thirty-two megabytes in bytes */
#define L2MEGABYTE	20
#define MEGABYTE	(1 << L2MEGABYTE)
#define MEGABYTE32	(MEGABYTE << 5)

/*
 * convert block number to bmap file page number
 *
 * Adds one page for every 2^13, 2^23 and 2^33 blocks, plus a constant 4.
 * NOTE(review): the three shifted terms presumably count dmap, L0 and L1
 * pages and the constant the fixed leading control pages - confirm against
 * jfs_dmap.h.
 *
 * The argument must have a 64-bit type: the shift by 33 is undefined for
 * narrower operands.
 */
#define BLKTODMAPN(b)\
	(((b) >> 13) + ((b) >> 23) + ((b) >> 33) + 3 + 1)
2005-04-17 02:20:36 +04:00
/*
2007-06-07 00:28:35 +04:00
* jfs_extendfs ( )
2005-04-17 02:20:36 +04:00
*
* function : extend file system ;
*
* | - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - | - - - - - - - - - - | - - - - - - - - - - |
* file system space fsck inline log
* workspace space
*
* input :
2007-06-07 00:28:35 +04:00
* new LVSize : in LV blocks ( required )
* new LogSize : in LV blocks ( optional )
* new FSSize : in LV blocks ( optional )
2005-04-17 02:20:36 +04:00
*
* new configuration :
* 1. set new LogSize as specified or default from new LVSize ;
* 2. compute new FSCKSize from new LVSize ;
* 3. set new FSSize as MIN ( FSSize , LVSize - ( LogSize + FSCKSize ) ) where
* assert ( new FSSize > = old FSSize ) ,
* i . e . , file system must not be shrinked ;
*/
int jfs_extendfs ( struct super_block * sb , s64 newLVSize , int newLogSize )
{
int rc = 0 ;
struct jfs_sb_info * sbi = JFS_SBI ( sb ) ;
struct inode * ipbmap = sbi - > ipbmap ;
struct inode * ipbmap2 ;
struct inode * ipimap = sbi - > ipimap ;
struct jfs_log * log = sbi - > log ;
struct bmap * bmp = sbi - > bmap ;
s64 newLogAddress , newFSCKAddress ;
int newFSCKSize ;
s64 newMapSize = 0 , mapSize ;
s64 XAddress , XSize , nblocks , xoff , xaddr , t64 ;
s64 oldLVSize ;
s64 newFSSize ;
s64 VolumeSize ;
int newNpages = 0 , nPages , newPage , xlen , t32 ;
int tid ;
int log_formatted = 0 ;
struct inode * iplist [ 1 ] ;
struct jfs_superblock * j_sb , * j_sb2 ;
uint old_agsize ;
2010-04-16 17:01:20 +04:00
int agsizechanged = 0 ;
2005-04-17 02:20:36 +04:00
struct buffer_head * bh , * bh2 ;
/* If the volume hasn't grown, get out now */
if ( sbi - > mntflag & JFS_INLINELOG )
oldLVSize = addressPXD ( & sbi - > logpxd ) + lengthPXD ( & sbi - > logpxd ) ;
else
oldLVSize = addressPXD ( & sbi - > fsckpxd ) +
lengthPXD ( & sbi - > fsckpxd ) ;
if ( oldLVSize > = newLVSize ) {
printk ( KERN_WARNING
" jfs_extendfs: volume hasn't grown, returning \n " ) ;
goto out ;
}
VolumeSize = sb - > s_bdev - > bd_inode - > i_size > > sb - > s_blocksize_bits ;
if ( VolumeSize ) {
if ( newLVSize > VolumeSize ) {
printk ( KERN_WARNING " jfs_extendfs: invalid size \n " ) ;
rc = - EINVAL ;
goto out ;
}
} else {
/* check the device */
bh = sb_bread ( sb , newLVSize - 1 ) ;
if ( ! bh ) {
printk ( KERN_WARNING " jfs_extendfs: invalid size \n " ) ;
rc = - EINVAL ;
goto out ;
}
bforget ( bh ) ;
}
/* Can't extend write-protected drive */
if ( isReadOnly ( ipbmap ) ) {
printk ( KERN_WARNING " jfs_extendfs: read-only file system \n " ) ;
rc = - EROFS ;
goto out ;
}
/*
2007-06-07 00:28:35 +04:00
* reconfigure LV spaces
* - - - - - - - - - - - - - - - - - - - - -
2005-04-17 02:20:36 +04:00
*
* validate new size , or , if not specified , determine new size
*/
/*
* reconfigure inline log space :
*/
if ( ( sbi - > mntflag & JFS_INLINELOG ) ) {
if ( newLogSize = = 0 ) {
/*
* no size specified : default to 1 / 256 of aggregate
* size ; rounded up to a megabyte boundary ;
*/
newLogSize = newLVSize > > 8 ;
t32 = ( 1 < < ( 20 - sbi - > l2bsize ) ) - 1 ;
newLogSize = ( newLogSize + t32 ) & ~ t32 ;
newLogSize =
min ( newLogSize , MEGABYTE32 > > sbi - > l2bsize ) ;
} else {
/*
* convert the newLogSize to fs blocks .
*
* Since this is given in megabytes , it will always be
* an even number of pages .
*/
newLogSize = ( newLogSize * MEGABYTE ) > > sbi - > l2bsize ;
}
} else
newLogSize = 0 ;
newLogAddress = newLVSize - newLogSize ;
/*
* reconfigure fsck work space :
*
* configure it to the end of the logical volume regardless of
* whether file system extends to the end of the aggregate ;
* Need enough 4 k pages to cover :
* - 1 bit per block in aggregate rounded up to BPERDMAP boundary
* - 1 extra page to handle control page and intermediate level pages
* - 50 extra pages for the chkdsk service log
*/
t64 = ( ( newLVSize - newLogSize + BPERDMAP - 1 ) > > L2BPERDMAP )
< < L2BPERDMAP ;
2007-08-31 21:57:28 +04:00
t32 = DIV_ROUND_UP ( t64 , BITSPERPAGE ) + 1 + 50 ;
2005-04-17 02:20:36 +04:00
newFSCKSize = t32 < < sbi - > l2nbperpage ;
newFSCKAddress = newLogAddress - newFSCKSize ;
/*
* compute new file system space ;
*/
newFSSize = newLVSize - newLogSize - newFSCKSize ;
/* file system cannot be shrinked */
if ( newFSSize < bmp - > db_mapsize ) {
rc = - EINVAL ;
goto out ;
}
/*
* If we ' re expanding enough that the inline log does not overlap
* the old one , we can format the new log before we quiesce the
* filesystem .
*/
if ( ( sbi - > mntflag & JFS_INLINELOG ) & & ( newLogAddress > oldLVSize ) ) {
if ( ( rc = lmLogFormat ( log , newLogAddress , newLogSize ) ) )
goto out ;
log_formatted = 1 ;
}
/*
2007-06-07 00:28:35 +04:00
* quiesce file system
2005-04-17 02:20:36 +04:00
*
* ( prepare to move the inline log and to prevent map update )
*
* block any new transactions and wait for completion of
* all wip transactions and flush modified pages s . t .
* on - disk file system is in consistent state and
* log is not required for recovery .
*/
txQuiesce ( sb ) ;
2005-05-02 22:25:02 +04:00
/* Reset size of direct inode */
sbi - > direct_inode - > i_size = sb - > s_bdev - > bd_inode - > i_size ;
2005-04-17 02:20:36 +04:00
if ( sbi - > mntflag & JFS_INLINELOG ) {
/*
* deactivate old inline log
*/
lmLogShutdown ( log ) ;
/*
* mark on - disk super block for fs in transition ;
*
* update on - disk superblock for the new space configuration
* of inline log space and fsck work space descriptors :
* N . B . FS descriptor is NOT updated ;
*
* crash recovery :
* logredo ( ) : if FM_EXTENDFS , return to fsck ( ) for cleanup ;
* fsck ( ) : if FM_EXTENDFS , reformat inline log and fsck
* workspace from superblock inline log descriptor and fsck
* workspace descriptor ;
*/
/* read in superblock */
if ( ( rc = readSuper ( sb , & bh ) ) )
goto error_out ;
j_sb = ( struct jfs_superblock * ) bh - > b_data ;
/* mark extendfs() in progress */
j_sb - > s_state | = cpu_to_le32 ( FM_EXTENDFS ) ;
j_sb - > s_xsize = cpu_to_le64 ( newFSSize ) ;
PXDaddress ( & j_sb - > s_xfsckpxd , newFSCKAddress ) ;
PXDlength ( & j_sb - > s_xfsckpxd , newFSCKSize ) ;
PXDaddress ( & j_sb - > s_xlogpxd , newLogAddress ) ;
PXDlength ( & j_sb - > s_xlogpxd , newLogSize ) ;
/* synchronously update superblock */
mark_buffer_dirty ( bh ) ;
sync_dirty_buffer ( bh ) ;
brelse ( bh ) ;
/*
* format new inline log synchronously ;
*
* crash recovery : if log move in progress ,
* reformat log and exit success ;
*/
if ( ! log_formatted )
if ( ( rc = lmLogFormat ( log , newLogAddress , newLogSize ) ) )
goto error_out ;
/*
* activate new log
*/
log - > base = newLogAddress ;
log - > size = newLogSize > > ( L2LOGPSIZE - sb - > s_blocksize_bits ) ;
if ( ( rc = lmLogInit ( log ) ) )
goto error_out ;
}
/*
2007-06-07 00:28:35 +04:00
* extend block allocation map
* - - - - - - - - - - - - - - - - - - - - - - - - - - -
2005-04-17 02:20:36 +04:00
*
* extendfs ( ) for new extension , retry after crash recovery ;
*
* note : both logredo ( ) and fsck ( ) rebuild map from
* the bitmap and configuration parameter from superblock
* ( disregarding all other control information in the map ) ;
*
* superblock :
* s_size : aggregate size in physical blocks ;
*/
/*
2007-06-07 00:28:35 +04:00
* compute the new block allocation map configuration
2005-04-17 02:20:36 +04:00
*
* map dinode :
* di_size : map file size in byte ;
* di_nblocks : number of blocks allocated for map file ;
* di_mapsize : number of blocks in aggregate ( covered by map ) ;
* map control page :
* db_mapsize : number of blocks in aggregate ( covered by map ) ;
*/
newMapSize = newFSSize ;
/* number of data pages of new bmap file:
* roundup new size to full dmap page boundary and
* add 1 extra dmap page for next extendfs ( )
*/
t64 = ( newMapSize - 1 ) + BPERDMAP ;
newNpages = BLKTODMAPN ( t64 ) + 1 ;
/*
2007-06-07 00:28:35 +04:00
* extend map from current map ( WITHOUT growing mapfile )
2005-04-17 02:20:36 +04:00
*
* map new extension with unmapped part of the last partial
* dmap page , if applicable , and extra page ( s ) allocated
* at end of bmap by mkfs ( ) or previous extendfs ( ) ;
*/
extendBmap :
/* compute number of blocks requested to extend */
mapSize = bmp - > db_mapsize ;
XAddress = mapSize ; /* eXtension Address */
XSize = newMapSize - mapSize ; /* eXtension Size */
old_agsize = bmp - > db_agsize ; /* We need to know if this changes */
/* compute number of blocks that can be extended by current mapfile */
t64 = dbMapFileSizeToMapSize ( ipbmap ) ;
if ( mapSize > t64 ) {
printk ( KERN_ERR " jfs_extendfs: mapSize (0x%Lx) > t64 (0x%Lx) \n " ,
( long long ) mapSize , ( long long ) t64 ) ;
rc = - EIO ;
goto error_out ;
}
nblocks = min ( t64 - mapSize , XSize ) ;
/*
* update map pages for new extension :
*
* update / init dmap and bubble up the control hierarchy
* incrementally fold up dmaps into upper levels ;
* update bmap control page ;
*/
if ( ( rc = dbExtendFS ( ipbmap , XAddress , nblocks ) ) )
goto error_out ;
2010-04-16 17:01:20 +04:00
agsizechanged | = ( bmp - > db_agsize ! = old_agsize ) ;
2005-04-17 02:20:36 +04:00
/*
* the map now has extended to cover additional nblocks :
* dn_mapsize = oldMapsize + nblocks ;
*/
/* ipbmap->i_mapsize += nblocks; */
XSize - = nblocks ;
/*
2007-06-07 00:28:35 +04:00
* grow map file to cover remaining extension
* and / or one extra dmap page for next extendfs ( ) ;
2005-04-17 02:20:36 +04:00
*
* allocate new map pages and its backing blocks , and
* update map file xtree
*/
/* compute number of data pages of current bmap file */
nPages = ipbmap - > i_size > > L2PSIZE ;
/* need to grow map file ? */
if ( nPages = = newNpages )
goto finalizeBmap ;
/*
* grow bmap file for the new map pages required :
*
* allocate growth at the start of newly extended region ;
* bmap file only grows sequentially , i . e . , both data pages
* and possibly xtree index pages may grow in append mode ,
* s . t . logredo ( ) can reconstruct pre - extension state
* by washing away bmap file of pages outside s_size boundary ;
*/
/*
* journal map file growth as if a regular file growth :
* ( note : bmap is created with di_mode = IFJOURNAL | IFREG ) ;
*
* journaling of bmap file growth is not required since
* logredo ( ) do / can not use log records of bmap file growth
* but it provides careful write semantics , pmap update , etc . ;
*/
/* synchronous write of data pages: bmap data pages are
* cached in meta - data cache , and not written out
* by txCommit ( ) ;
*/
filemap_fdatawait ( ipbmap - > i_mapping ) ;
[PATCH] Fix and add EXPORT_SYMBOL(filemap_write_and_wait)
This patch add EXPORT_SYMBOL(filemap_write_and_wait) and use it.
See mm/filemap.c:
And changes the filemap_write_and_wait() and filemap_write_and_wait_range().
Current filemap_write_and_wait() doesn't wait if filemap_fdatawrite()
returns error. However, even if filemap_fdatawrite() returned an
error, it may have submitted the partially data pages to the device.
(e.g. in the case of -ENOSPC)
<quotation>
Andrew Morton writes,
If filemap_fdatawrite() returns an error, this might be due to some
I/O problem: dead disk, unplugged cable, etc. Given the generally
crappy quality of the kernel's handling of such exceptions, there's a
good chance that the filemap_fdatawait() will get stuck in D state
forever.
</quotation>
So, this patch doesn't wait if filemap_fdatawrite() returns the -EIO.
Trond, could you please review the nfs part? Especially I'm not sure,
nfs must use the "filemap_fdatawrite(inode->i_mapping) == 0", or not.
Acked-by: Trond Myklebust <trond.myklebust@fys.uio.no>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2006-01-08 12:02:14 +03:00
filemap_write_and_wait ( ipbmap - > i_mapping ) ;
2005-04-17 02:20:36 +04:00
diWriteSpecial ( ipbmap , 0 ) ;
newPage = nPages ; /* first new page number */
xoff = newPage < < sbi - > l2nbperpage ;
xlen = ( newNpages - nPages ) < < sbi - > l2nbperpage ;
xlen = min ( xlen , ( int ) nblocks ) & ~ ( sbi - > nbperpage - 1 ) ;
xaddr = XAddress ;
tid = txBegin ( sb , COMMIT_FORCE ) ;
if ( ( rc = xtAppend ( tid , ipbmap , 0 , xoff , nblocks , & xlen , & xaddr , 0 ) ) ) {
txEnd ( tid ) ;
goto error_out ;
}
/* update bmap file size */
ipbmap - > i_size + = xlen < < sbi - > l2bsize ;
inode_add_bytes ( ipbmap , xlen < < sbi - > l2bsize ) ;
iplist [ 0 ] = ipbmap ;
rc = txCommit ( tid , 1 , & iplist [ 0 ] , COMMIT_FORCE ) ;
txEnd ( tid ) ;
if ( rc )
goto error_out ;
/*
* map file has been grown now to cover extension to further out ;
* di_size = new map file size ;
*
* if huge extension , the previous extension based on previous
* map file size may not have been sufficient to cover whole extension
* ( it could have been used up for new map pages ) ,
* but the newly grown map file now covers lot bigger new free space
* available for further extension of map ;
*/
/* any more blocks to extend ? */
if ( XSize )
goto extendBmap ;
finalizeBmap :
/* finalize bmap */
dbFinalizeBmap ( ipbmap ) ;
/*
2007-06-07 00:28:35 +04:00
* update inode allocation map
* - - - - - - - - - - - - - - - - - - - - - - - - - - -
2005-04-17 02:20:36 +04:00
*
* move iag lists from old to new iag ;
* agstart field is not updated for logredo ( ) to reconstruct
* iag lists if system crash occurs .
* ( computation of ag number from agstart based on agsize
* will correctly identify the new ag ) ;
*/
/* if new AG size the same as old AG size, done! */
2010-04-16 17:01:20 +04:00
if ( agsizechanged ) {
2005-04-17 02:20:36 +04:00
if ( ( rc = diExtendFS ( ipimap , ipbmap ) ) )
goto error_out ;
/* finalize imap */
if ( ( rc = diSync ( ipimap ) ) )
goto error_out ;
}
/*
2007-06-07 00:28:35 +04:00
* finalize
* - - - - - - - -
2005-04-17 02:20:36 +04:00
*
* extension is committed when on - disk super block is
* updated with new descriptors : logredo will recover
* crash before it to pre - extension state ;
*/
/* sync log to skip log replay of bmap file growth transaction; */
/* lmLogSync(log, 1); */
/*
* synchronous write bmap global control page ;
* for crash before completion of write
* logredo ( ) will recover to pre - extendfs state ;
* for crash after completion of write ,
* logredo ( ) will recover post - extendfs state ;
*/
if ( ( rc = dbSync ( ipbmap ) ) )
goto error_out ;
/*
* copy primary bmap inode to secondary bmap inode
*/
ipbmap2 = diReadSpecial ( sb , BMAP_I , 1 ) ;
if ( ipbmap2 = = NULL ) {
printk ( KERN_ERR " jfs_extendfs: diReadSpecial(bmap) failed \n " ) ;
goto error_out ;
}
memcpy ( & JFS_IP ( ipbmap2 ) - > i_xtroot , & JFS_IP ( ipbmap ) - > i_xtroot , 288 ) ;
ipbmap2 - > i_size = ipbmap - > i_size ;
ipbmap2 - > i_blocks = ipbmap - > i_blocks ;
diWriteSpecial ( ipbmap2 , 1 ) ;
diFreeSpecial ( ipbmap2 ) ;
/*
2007-06-07 00:28:35 +04:00
* update superblock
2005-04-17 02:20:36 +04:00
*/
if ( ( rc = readSuper ( sb , & bh ) ) )
goto error_out ;
j_sb = ( struct jfs_superblock * ) bh - > b_data ;
/* mark extendfs() completion */
j_sb - > s_state & = cpu_to_le32 ( ~ FM_EXTENDFS ) ;
j_sb - > s_size = cpu_to_le64 ( bmp - > db_mapsize < <
le16_to_cpu ( j_sb - > s_l2bfactor ) ) ;
j_sb - > s_agsize = cpu_to_le32 ( bmp - > db_agsize ) ;
/* update inline log space descriptor */
if ( sbi - > mntflag & JFS_INLINELOG ) {
PXDaddress ( & ( j_sb - > s_logpxd ) , newLogAddress ) ;
PXDlength ( & ( j_sb - > s_logpxd ) , newLogSize ) ;
}
/* record log's mount serial number */
j_sb - > s_logserial = cpu_to_le32 ( log - > serial ) ;
/* update fsck work space descriptor */
PXDaddress ( & ( j_sb - > s_fsckpxd ) , newFSCKAddress ) ;
PXDlength ( & ( j_sb - > s_fsckpxd ) , newFSCKSize ) ;
j_sb - > s_fscklog = 1 ;
/* sb->s_fsckloglen remains the same */
/* Update secondary superblock */
bh2 = sb_bread ( sb , SUPER2_OFF > > sb - > s_blocksize_bits ) ;
if ( bh2 ) {
j_sb2 = ( struct jfs_superblock * ) bh2 - > b_data ;
memcpy ( j_sb2 , j_sb , sizeof ( struct jfs_superblock ) ) ;
mark_buffer_dirty ( bh ) ;
sync_dirty_buffer ( bh2 ) ;
brelse ( bh2 ) ;
}
/* write primary superblock */
mark_buffer_dirty ( bh ) ;
sync_dirty_buffer ( bh ) ;
brelse ( bh ) ;
goto resume ;
error_out :
jfs_error ( sb , " jfs_extendfs " ) ;
resume :
/*
2007-06-07 00:28:35 +04:00
* resume file system transactions
2005-04-17 02:20:36 +04:00
*/
txResume ( sb ) ;
out :
return rc ;
}