2011-01-07 16:02:04 +03:00
/*
* Copyright ( C ) 2010 Red Hat , Inc .
* All Rights Reserved .
*
* This program is free software ; you can redistribute it and / or
* modify it under the terms of the GNU General Public License as
* published by the Free Software Foundation .
*
* This program is distributed in the hope that it would be useful ,
* but WITHOUT ANY WARRANTY ; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
* GNU General Public License for more details .
*
* You should have received a copy of the GNU General Public License
* along with this program ; if not , write the Free Software Foundation ,
* Inc . , 51 Franklin St , Fifth Floor , Boston , MA 02110 - 1301 USA
*/
# include "xfs.h"
2013-08-12 14:49:26 +04:00
# include "xfs_format.h"
2013-10-23 03:50:10 +04:00
# include "xfs_log_format.h"
# include "xfs_trans_resv.h"
2013-08-12 14:49:32 +04:00
# include "xfs_sb.h"
2011-01-07 16:02:04 +03:00
# include "xfs_mount.h"
# include "xfs_quota.h"
# include "xfs_inode.h"
2013-10-23 03:51:50 +04:00
# include "xfs_btree.h"
# include "xfs_alloc_btree.h"
2011-01-07 16:02:04 +03:00
# include "xfs_alloc.h"
# include "xfs_error.h"
2012-04-29 14:39:43 +04:00
# include "xfs_extent_busy.h"
2011-01-07 16:02:04 +03:00
# include "xfs_discard.h"
# include "xfs_trace.h"
2013-10-23 03:50:10 +04:00
# include "xfs_log.h"
2011-01-07 16:02:04 +03:00
STATIC int
xfs_trim_extents (
struct xfs_mount * mp ,
xfs_agnumber_t agno ,
2012-03-22 09:15:12 +04:00
xfs_daddr_t start ,
xfs_daddr_t end ,
xfs_daddr_t minlen ,
2017-06-16 21:00:05 +03:00
uint64_t * blocks_trimmed )
2011-01-07 16:02:04 +03:00
{
struct block_device * bdev = mp - > m_ddev_targp - > bt_bdev ;
struct xfs_btree_cur * cur ;
struct xfs_buf * agbp ;
struct xfs_perag * pag ;
int error ;
int i ;
pag = xfs_perag_get ( mp , agno ) ;
error = xfs_alloc_read_agf ( mp , NULL , agno , 0 , & agbp ) ;
if ( error | | ! agbp )
goto out_put_perag ;
cur = xfs_allocbt_init_cursor ( mp , NULL , agbp , agno , XFS_BTNUM_CNT ) ;
/*
* Force out the log . This means any transactions that might have freed
* space before we took the AGF buffer lock are now on disk , and the
* volatile disk cache is flushed .
*/
xfs_log_force ( mp , XFS_LOG_SYNC ) ;
/*
* Look up the longest btree in the AGF and start with it .
*/
2012-03-22 09:15:12 +04:00
error = xfs_alloc_lookup_ge ( cur , 0 ,
2011-12-21 04:07:42 +04:00
be32_to_cpu ( XFS_BUF_TO_AGF ( agbp ) - > agf_longest ) , & i ) ;
2011-01-07 16:02:04 +03:00
if ( error )
goto out_del_cursor ;
/*
* Loop until we are done with all extents that are large
* enough to be worth discarding .
*/
while ( i ) {
2012-03-22 09:15:12 +04:00
xfs_agblock_t fbno ;
xfs_extlen_t flen ;
xfs_daddr_t dbno ;
xfs_extlen_t dlen ;
2011-01-07 16:02:04 +03:00
error = xfs_alloc_get_rec ( cur , & fbno , & flen , & i ) ;
if ( error )
goto out_del_cursor ;
2015-02-23 14:39:08 +03:00
XFS_WANT_CORRUPTED_GOTO ( mp , i = = 1 , out_del_cursor ) ;
2011-12-21 04:07:42 +04:00
ASSERT ( flen < = be32_to_cpu ( XFS_BUF_TO_AGF ( agbp ) - > agf_longest ) ) ;
2011-01-07 16:02:04 +03:00
2012-03-22 09:15:12 +04:00
/*
* use daddr format for all range / len calculations as that is
* the format the range / len variables are supplied in by
* userspace .
*/
dbno = XFS_AGB_TO_DADDR ( mp , agno , fbno ) ;
dlen = XFS_FSB_TO_BB ( mp , flen ) ;
2011-01-07 16:02:04 +03:00
/*
* Too small ? Give up .
*/
2012-03-22 09:15:12 +04:00
if ( dlen < minlen ) {
2011-01-07 16:02:04 +03:00
trace_xfs_discard_toosmall ( mp , agno , fbno , flen ) ;
goto out_del_cursor ;
}
/*
* If the extent is entirely outside of the range we are
* supposed to discard skip it . Do not bother to trim
* down partially overlapping ranges for now .
*/
2012-03-22 09:15:12 +04:00
if ( dbno + dlen < start | | dbno > end ) {
2011-01-07 16:02:04 +03:00
trace_xfs_discard_exclude ( mp , agno , fbno , flen ) ;
goto next_extent ;
}
/*
* If any blocks in the range are still busy , skip the
* discard and try again the next time .
*/
2012-04-29 14:41:10 +04:00
if ( xfs_extent_busy_search ( mp , agno , fbno , flen ) ) {
2011-01-07 16:02:04 +03:00
trace_xfs_discard_busy ( mp , agno , fbno , flen ) ;
goto next_extent ;
}
trace_xfs_discard_extent ( mp , agno , fbno , flen ) ;
2014-06-25 08:58:08 +04:00
error = blkdev_issue_discard ( bdev , dbno , dlen , GFP_NOFS , 0 ) ;
2011-01-07 16:02:04 +03:00
if ( error )
goto out_del_cursor ;
* blocks_trimmed + = flen ;
next_extent :
error = xfs_btree_decrement ( cur , 0 , & i ) ;
if ( error )
goto out_del_cursor ;
2017-04-27 18:59:36 +03:00
if ( fatal_signal_pending ( current ) ) {
error = - ERESTARTSYS ;
goto out_del_cursor ;
}
2011-01-07 16:02:04 +03:00
}
out_del_cursor :
xfs_btree_del_cursor ( cur , error ? XFS_BTREE_ERROR : XFS_BTREE_NOERROR ) ;
xfs_buf_relse ( agbp ) ;
out_put_perag :
xfs_perag_put ( pag ) ;
return error ;
}
2012-03-22 09:15:12 +04:00
/*
* trim a range of the filesystem .
*
* Note : the parameters passed from userspace are byte ranges into the
* filesystem which does not match to the format we use for filesystem block
* addressing . FSB addressing is sparse ( AGNO | AGBNO ) , while the incoming format
* is a linear address range . Hence we need to use DADDR based conversions and
* comparisons for determining the correct offset and regions to trim .
*/
2011-01-07 16:02:04 +03:00
int
xfs_ioc_trim (
struct xfs_mount * mp ,
struct fstrim_range __user * urange )
{
2013-11-20 12:08:53 +04:00
struct request_queue * q = bdev_get_queue ( mp - > m_ddev_targp - > bt_bdev ) ;
2011-01-07 16:02:04 +03:00
unsigned int granularity = q - > limits . discard_granularity ;
struct fstrim_range range ;
2012-03-22 09:15:12 +04:00
xfs_daddr_t start , end , minlen ;
2011-01-07 16:02:04 +03:00
xfs_agnumber_t start_agno , end_agno , agno ;
2017-06-16 21:00:05 +03:00
uint64_t blocks_trimmed = 0 ;
2011-01-07 16:02:04 +03:00
int error , last_error = 0 ;
if ( ! capable ( CAP_SYS_ADMIN ) )
2014-06-22 09:04:54 +04:00
return - EPERM ;
2011-02-15 20:07:36 +03:00
if ( ! blk_queue_discard ( q ) )
2014-06-22 09:04:54 +04:00
return - EOPNOTSUPP ;
2011-01-07 16:02:04 +03:00
if ( copy_from_user ( & range , urange , sizeof ( range ) ) )
2014-06-22 09:04:54 +04:00
return - EFAULT ;
2011-01-07 16:02:04 +03:00
/*
* Truncating down the len isn ' t actually quite correct , but using
2012-03-22 09:15:12 +04:00
* BBTOB would mean we trivially get overflows for values
2011-01-07 16:02:04 +03:00
* of ULLONG_MAX or slightly lower . And ULLONG_MAX is the default
* used by the fstrim application . In the end it really doesn ' t
* matter as trimming blocks is an advisory interface .
*/
2012-08-14 12:35:04 +04:00
if ( range . start > = XFS_FSB_TO_B ( mp , mp - > m_sb . sb_dblocks ) | |
2016-08-03 04:38:24 +03:00
range . minlen > XFS_FSB_TO_B ( mp , mp - > m_ag_max_usable ) | |
2013-11-20 12:08:53 +04:00
range . len < mp - > m_sb . sb_blocksize )
2014-06-22 09:04:54 +04:00
return - EINVAL ;
2012-08-14 12:35:04 +04:00
2012-03-22 09:15:12 +04:00
start = BTOBB ( range . start ) ;
end = start + BTOBBT ( range . len ) - 1 ;
minlen = BTOBB ( max_t ( u64 , granularity , range . minlen ) ) ;
2011-01-07 16:02:04 +03:00
2012-03-22 09:15:12 +04:00
if ( end > XFS_FSB_TO_BB ( mp , mp - > m_sb . sb_dblocks ) - 1 )
end = XFS_FSB_TO_BB ( mp , mp - > m_sb . sb_dblocks ) - 1 ;
2011-01-07 16:02:04 +03:00
2012-03-22 09:15:12 +04:00
start_agno = xfs_daddr_to_agno ( mp , start ) ;
end_agno = xfs_daddr_to_agno ( mp , end ) ;
2011-01-07 16:02:04 +03:00
for ( agno = start_agno ; agno < = end_agno ; agno + + ) {
2014-06-25 08:58:08 +04:00
error = xfs_trim_extents ( mp , agno , start , end , minlen ,
2011-01-07 16:02:04 +03:00
& blocks_trimmed ) ;
2017-04-27 18:59:36 +03:00
if ( error ) {
2011-01-07 16:02:04 +03:00
last_error = error ;
2017-04-27 18:59:36 +03:00
if ( error = = - ERESTARTSYS )
break ;
}
2011-01-07 16:02:04 +03:00
}
if ( last_error )
return last_error ;
range . len = XFS_FSB_TO_B ( mp , blocks_trimmed ) ;
if ( copy_to_user ( urange , & range , sizeof ( range ) ) )
2014-06-22 09:04:54 +04:00
return - EFAULT ;
2011-01-07 16:02:04 +03:00
return 0 ;
}