2008-01-29 14:04:06 +01:00
/*
* Functions related to segment and merge handling
*/
# include <linux/kernel.h>
# include <linux/module.h>
# include <linux/bio.h>
# include <linux/blkdev.h>
# include <linux/scatterlist.h>
2015-12-03 17:32:30 +03:00
# include <trace/events/block.h>
2008-01-29 14:04:06 +01:00
# include "blk.h"
2015-04-23 22:37:18 -07:00
static struct bio * blk_bio_discard_split ( struct request_queue * q ,
struct bio * bio ,
2015-10-20 23:13:52 +08:00
struct bio_set * bs ,
unsigned * nsegs )
2015-04-23 22:37:18 -07:00
{
unsigned int max_discard_sectors , granularity ;
int alignment ;
sector_t tmp ;
unsigned split_sectors ;
2015-10-20 23:13:52 +08:00
* nsegs = 1 ;
2015-04-23 22:37:18 -07:00
/* Zero-sector (unknown) and one-sector granularities are the same. */
granularity = max ( q - > limits . discard_granularity > > 9 , 1U ) ;
max_discard_sectors = min ( q - > limits . max_discard_sectors , UINT_MAX > > 9 ) ;
max_discard_sectors - = max_discard_sectors % granularity ;
if ( unlikely ( ! max_discard_sectors ) ) {
/* XXX: warn */
return NULL ;
}
if ( bio_sectors ( bio ) < = max_discard_sectors )
return NULL ;
split_sectors = max_discard_sectors ;
/*
* If the next starting sector would be misaligned , stop the discard at
* the previous aligned sector .
*/
alignment = ( q - > limits . discard_alignment > > 9 ) % granularity ;
tmp = bio - > bi_iter . bi_sector + split_sectors - alignment ;
tmp = sector_div ( tmp , granularity ) ;
if ( split_sectors > tmp )
split_sectors - = tmp ;
return bio_split ( bio , split_sectors , GFP_NOIO , bs ) ;
}
static struct bio * blk_bio_write_same_split ( struct request_queue * q ,
struct bio * bio ,
2015-10-20 23:13:52 +08:00
struct bio_set * bs ,
unsigned * nsegs )
2015-04-23 22:37:18 -07:00
{
2015-10-20 23:13:52 +08:00
* nsegs = 1 ;
2015-04-23 22:37:18 -07:00
if ( ! q - > limits . max_write_same_sectors )
return NULL ;
if ( bio_sectors ( bio ) < = q - > limits . max_write_same_sectors )
return NULL ;
return bio_split ( bio , q - > limits . max_write_same_sectors , GFP_NOIO , bs ) ;
}
2016-01-23 08:05:33 +08:00
static inline unsigned get_max_io_size ( struct request_queue * q ,
struct bio * bio )
{
unsigned sectors = blk_max_size_offset ( q , bio - > bi_iter . bi_sector ) ;
unsigned mask = queue_logical_block_size ( q ) - 1 ;
/* aligned to logical block size */
sectors & = ~ ( mask > > 9 ) ;
return sectors ;
}
2015-04-23 22:37:18 -07:00
static struct bio * blk_bio_segment_split ( struct request_queue * q ,
struct bio * bio ,
2015-10-20 23:13:52 +08:00
struct bio_set * bs ,
unsigned * segs )
2015-04-23 22:37:18 -07:00
{
2015-09-02 16:46:02 -06:00
struct bio_vec bv , bvprv , * bvprvp = NULL ;
2015-04-23 22:37:18 -07:00
struct bvec_iter iter ;
2015-04-27 23:48:34 -07:00
unsigned seg_size = 0 , nsegs = 0 , sectors = 0 ;
2015-11-24 10:35:30 +08:00
unsigned front_seg_size = bio - > bi_seg_front_size ;
bool do_split = true ;
struct bio * new = NULL ;
2016-01-23 08:05:33 +08:00
const unsigned max_sectors = get_max_io_size ( q , bio ) ;
2016-08-23 21:49:45 +08:00
unsigned bvecs = 0 ;
2015-04-23 22:37:18 -07:00
bio_for_each_segment ( bv , bio , iter ) {
2016-08-23 21:49:45 +08:00
/*
* With arbitrary bio size , the incoming bio may be very
* big . We have to split the bio into small bios so that
* each holds at most BIO_MAX_PAGES bvecs because
* bio_clone ( ) can fail to allocate big bvecs .
*
* It should have been better to apply the limit per
* request queue in which bio_clone ( ) is involved ,
* instead of globally . The biggest blocker is the
* bio_clone ( ) in bio bounce .
*
* If bio is splitted by this reason , we should have
* allowed to continue bios merging , but don ' t do
* that now for making the change simple .
*
* TODO : deal with bio bounce ' s bio_clone ( ) gracefully
* and convert the global limit into per - queue limit .
*/
if ( bvecs + + > = BIO_MAX_PAGES )
goto split ;
2015-04-23 22:37:18 -07:00
/*
* If the queue doesn ' t support SG gaps and adding this
* offset would create a gap , disallow it .
*/
2015-09-02 16:46:02 -06:00
if ( bvprvp & & bvec_gap_to_prev ( q , bvprvp , bv . bv_offset ) )
2015-04-23 22:37:18 -07:00
goto split ;
2016-01-23 08:05:33 +08:00
if ( sectors + ( bv . bv_len > > 9 ) > max_sectors ) {
2016-01-12 15:08:39 -07:00
/*
* Consider this a new segment if we ' re splitting in
* the middle of this vector .
*/
if ( nsegs < queue_max_segments ( q ) & &
2016-01-23 08:05:33 +08:00
sectors < max_sectors ) {
2016-01-12 15:08:39 -07:00
nsegs + + ;
2016-01-23 08:05:33 +08:00
sectors = max_sectors ;
2016-01-12 15:08:39 -07:00
}
2016-01-23 08:05:33 +08:00
if ( sectors )
goto split ;
/* Make this single bvec as the 1st segment */
2016-01-12 15:08:39 -07:00
}
2015-09-02 16:46:02 -06:00
if ( bvprvp & & blk_queue_cluster ( q ) ) {
2015-04-23 22:37:18 -07:00
if ( seg_size + bv . bv_len > queue_max_segment_size ( q ) )
goto new_segment ;
2015-09-02 16:46:02 -06:00
if ( ! BIOVEC_PHYS_MERGEABLE ( bvprvp , & bv ) )
2015-04-23 22:37:18 -07:00
goto new_segment ;
2015-09-02 16:46:02 -06:00
if ( ! BIOVEC_SEG_BOUNDARY ( q , bvprvp , & bv ) )
2015-04-23 22:37:18 -07:00
goto new_segment ;
seg_size + = bv . bv_len ;
bvprv = bv ;
2015-11-24 10:35:29 +08:00
bvprvp = & bvprv ;
2015-09-17 09:58:38 -06:00
sectors + = bv . bv_len > > 9 ;
2015-11-30 16:05:49 +08:00
if ( nsegs = = 1 & & seg_size > front_seg_size )
front_seg_size = seg_size ;
2015-04-23 22:37:18 -07:00
continue ;
}
new_segment :
if ( nsegs = = queue_max_segments ( q ) )
goto split ;
nsegs + + ;
bvprv = bv ;
2015-11-24 10:35:29 +08:00
bvprvp = & bvprv ;
2015-04-23 22:37:18 -07:00
seg_size = bv . bv_len ;
2015-09-17 09:58:38 -06:00
sectors + = bv . bv_len > > 9 ;
2015-11-24 10:35:30 +08:00
if ( nsegs = = 1 & & seg_size > front_seg_size )
front_seg_size = seg_size ;
2015-04-23 22:37:18 -07:00
}
2015-11-24 10:35:30 +08:00
do_split = false ;
2015-04-23 22:37:18 -07:00
split :
2015-10-20 23:13:52 +08:00
* segs = nsegs ;
2015-11-24 10:35:30 +08:00
if ( do_split ) {
new = bio_split ( bio , sectors , GFP_NOIO , bs ) ;
if ( new )
bio = new ;
}
bio - > bi_seg_front_size = front_seg_size ;
if ( seg_size > bio - > bi_seg_back_size )
bio - > bi_seg_back_size = seg_size ;
return do_split ? new : NULL ;
2015-04-23 22:37:18 -07:00
}
void blk_queue_split ( struct request_queue * q , struct bio * * bio ,
struct bio_set * bs )
{
2015-10-20 23:13:52 +08:00
struct bio * split , * res ;
unsigned nsegs ;
2015-04-23 22:37:18 -07:00
2016-08-16 10:59:35 +03:00
switch ( bio_op ( * bio ) ) {
case REQ_OP_DISCARD :
case REQ_OP_SECURE_ERASE :
2015-10-20 23:13:52 +08:00
split = blk_bio_discard_split ( q , * bio , bs , & nsegs ) ;
2016-08-16 10:59:35 +03:00
break ;
2016-11-30 12:28:59 -08:00
case REQ_OP_WRITE_ZEROES :
split = NULL ;
nsegs = ( * bio ) - > bi_phys_segments ;
break ;
2016-08-16 10:59:35 +03:00
case REQ_OP_WRITE_SAME :
2015-10-20 23:13:52 +08:00
split = blk_bio_write_same_split ( q , * bio , bs , & nsegs ) ;
2016-08-16 10:59:35 +03:00
break ;
default :
2015-10-20 23:13:52 +08:00
split = blk_bio_segment_split ( q , * bio , q - > bio_split , & nsegs ) ;
2016-08-16 10:59:35 +03:00
break ;
}
2015-10-20 23:13:52 +08:00
/* physical segments can be figured out during splitting */
res = split ? split : * bio ;
res - > bi_phys_segments = nsegs ;
bio_set_flag ( res , BIO_SEG_VALID ) ;
2015-04-23 22:37:18 -07:00
if ( split ) {
2015-10-20 23:13:53 +08:00
/* there isn't chance to merge the splitted bio */
2016-08-05 15:35:16 -06:00
split - > bi_opf | = REQ_NOMERGE ;
2015-10-20 23:13:53 +08:00
2015-04-23 22:37:18 -07:00
bio_chain ( split , * bio ) ;
2015-12-03 17:32:30 +03:00
trace_block_split ( q , split , ( * bio ) - > bi_iter . bi_sector ) ;
2015-04-23 22:37:18 -07:00
generic_make_request ( * bio ) ;
* bio = split ;
}
}
EXPORT_SYMBOL ( blk_queue_split ) ;
2009-02-23 09:03:10 +01:00
static unsigned int __blk_recalc_rq_segments ( struct request_queue * q ,
2014-09-02 23:02:59 +08:00
struct bio * bio ,
bool no_sg_merge )
2008-01-29 14:04:06 +01:00
{
2013-11-23 17:19:00 -08:00
struct bio_vec bv , bvprv = { NULL } ;
2015-04-23 22:37:18 -07:00
int cluster , prev = 0 ;
2009-02-23 09:03:10 +01:00
unsigned int seg_size , nr_phys_segs ;
2009-03-06 08:55:24 +01:00
struct bio * fbio , * bbio ;
2013-11-23 17:19:00 -08:00
struct bvec_iter iter ;
2008-01-29 14:04:06 +01:00
2009-02-23 09:03:10 +01:00
if ( ! bio )
return 0 ;
2008-01-29 14:04:06 +01:00
2016-11-30 12:28:59 -08:00
switch ( bio_op ( bio ) ) {
case REQ_OP_DISCARD :
case REQ_OP_SECURE_ERASE :
case REQ_OP_WRITE_ZEROES :
2016-12-08 15:20:32 -07:00
return 0 ;
case REQ_OP_WRITE_SAME :
2014-02-07 13:53:46 -07:00
return 1 ;
2016-11-30 12:28:59 -08:00
}
2014-02-07 13:53:46 -07:00
2009-02-23 09:03:10 +01:00
fbio = bio ;
2010-12-01 19:41:49 +01:00
cluster = blk_queue_cluster ( q ) ;
2008-08-15 10:20:02 +02:00
seg_size = 0 ;
2010-06-21 11:02:47 +02:00
nr_phys_segs = 0 ;
2009-02-23 09:03:10 +01:00
for_each_bio ( bio ) {
2013-11-23 17:19:00 -08:00
bio_for_each_segment ( bv , bio , iter ) {
2014-05-29 09:53:32 -06:00
/*
* If SG merging is disabled , each bio vector is
* a segment
*/
if ( no_sg_merge )
goto new_segment ;
2015-04-23 22:37:18 -07:00
if ( prev & & cluster ) {
2013-11-23 17:19:00 -08:00
if ( seg_size + bv . bv_len
2009-05-22 17:17:50 -04:00
> queue_max_segment_size ( q ) )
2009-02-23 09:03:10 +01:00
goto new_segment ;
2013-11-23 17:19:00 -08:00
if ( ! BIOVEC_PHYS_MERGEABLE ( & bvprv , & bv ) )
2009-02-23 09:03:10 +01:00
goto new_segment ;
2013-11-23 17:19:00 -08:00
if ( ! BIOVEC_SEG_BOUNDARY ( q , & bvprv , & bv ) )
2009-02-23 09:03:10 +01:00
goto new_segment ;
2008-01-29 14:04:06 +01:00
2013-11-23 17:19:00 -08:00
seg_size + = bv . bv_len ;
2009-02-23 09:03:10 +01:00
bvprv = bv ;
continue ;
}
2008-01-29 14:04:06 +01:00
new_segment :
2009-02-23 09:03:10 +01:00
if ( nr_phys_segs = = 1 & & seg_size >
fbio - > bi_seg_front_size )
fbio - > bi_seg_front_size = seg_size ;
2008-10-13 14:19:05 +02:00
2009-02-23 09:03:10 +01:00
nr_phys_segs + + ;
bvprv = bv ;
2015-04-23 22:37:18 -07:00
prev = 1 ;
2013-11-23 17:19:00 -08:00
seg_size = bv . bv_len ;
2009-02-23 09:03:10 +01:00
}
2009-03-06 08:55:24 +01:00
bbio = bio ;
2008-01-29 14:04:06 +01:00
}
2009-03-06 08:55:24 +01:00
if ( nr_phys_segs = = 1 & & seg_size > fbio - > bi_seg_front_size )
fbio - > bi_seg_front_size = seg_size ;
if ( seg_size > bbio - > bi_seg_back_size )
bbio - > bi_seg_back_size = seg_size ;
2009-02-23 09:03:10 +01:00
return nr_phys_segs ;
}
void blk_recalc_rq_segments ( struct request * rq )
{
2014-09-02 23:02:59 +08:00
bool no_sg_merge = ! ! test_bit ( QUEUE_FLAG_NO_SG_MERGE ,
& rq - > q - > queue_flags ) ;
rq - > nr_phys_segments = __blk_recalc_rq_segments ( rq - > q , rq - > bio ,
no_sg_merge ) ;
2008-01-29 14:04:06 +01:00
}
void blk_recount_segments ( struct request_queue * q , struct bio * bio )
{
2014-11-12 00:15:41 +08:00
unsigned short seg_cnt ;
/* estimate segment number by bi_vcnt for non-cloned bio */
if ( bio_flagged ( bio , BIO_CLONED ) )
seg_cnt = bio_segments ( bio ) ;
else
seg_cnt = bio - > bi_vcnt ;
2014-10-09 23:17:35 +08:00
2014-11-12 00:15:41 +08:00
if ( test_bit ( QUEUE_FLAG_NO_SG_MERGE , & q - > queue_flags ) & &
( seg_cnt < queue_max_segments ( q ) ) )
bio - > bi_phys_segments = seg_cnt ;
2014-05-29 09:53:32 -06:00
else {
struct bio * nxt = bio - > bi_next ;
bio - > bi_next = NULL ;
2014-11-12 00:15:41 +08:00
bio - > bi_phys_segments = __blk_recalc_rq_segments ( q , bio , false ) ;
2014-05-29 09:53:32 -06:00
bio - > bi_next = nxt ;
}
2009-02-23 09:03:10 +01:00
2015-07-24 12:37:59 -06:00
bio_set_flag ( bio , BIO_SEG_VALID ) ;
2008-01-29 14:04:06 +01:00
}
EXPORT_SYMBOL ( blk_recount_segments ) ;
static int blk_phys_contig_segment ( struct request_queue * q , struct bio * bio ,
struct bio * nxt )
{
2013-12-03 14:29:09 -07:00
struct bio_vec end_bv = { NULL } , nxt_bv ;
2013-08-07 14:30:33 -07:00
2010-12-01 19:41:49 +01:00
if ( ! blk_queue_cluster ( q ) )
2008-01-29 14:04:06 +01:00
return 0 ;
2008-10-13 14:19:05 +02:00
if ( bio - > bi_seg_back_size + nxt - > bi_seg_front_size >
2009-05-22 17:17:50 -04:00
queue_max_segment_size ( q ) )
2008-01-29 14:04:06 +01:00
return 0 ;
2008-08-09 16:42:20 +01:00
if ( ! bio_has_data ( bio ) )
return 1 ;
2016-02-26 23:40:53 +08:00
bio_get_last_bvec ( bio , & end_bv ) ;
bio_get_first_bvec ( nxt , & nxt_bv ) ;
2013-08-07 14:30:33 -07:00
if ( ! BIOVEC_PHYS_MERGEABLE ( & end_bv , & nxt_bv ) )
2008-08-09 16:42:20 +01:00
return 0 ;
2008-01-29 14:04:06 +01:00
/*
2008-08-09 16:42:20 +01:00
* bio and nxt are contiguous in memory ; check if the queue allows
2008-01-29 14:04:06 +01:00
* these two to be merged into one
*/
2013-08-07 14:30:33 -07:00
if ( BIOVEC_SEG_BOUNDARY ( q , & end_bv , & nxt_bv ) )
2008-01-29 14:04:06 +01:00
return 1 ;
return 0 ;
}
2013-11-23 17:19:00 -08:00
static inline void
2012-08-02 23:42:03 +02:00
__blk_segment_map_sg ( struct request_queue * q , struct bio_vec * bvec ,
2013-11-23 17:19:00 -08:00
struct scatterlist * sglist , struct bio_vec * bvprv ,
2012-08-02 23:42:03 +02:00
struct scatterlist * * sg , int * nsegs , int * cluster )
{
int nbytes = bvec - > bv_len ;
2013-11-23 17:19:00 -08:00
if ( * sg & & * cluster ) {
2012-08-02 23:42:03 +02:00
if ( ( * sg ) - > length + nbytes > queue_max_segment_size ( q ) )
goto new_segment ;
2013-11-23 17:19:00 -08:00
if ( ! BIOVEC_PHYS_MERGEABLE ( bvprv , bvec ) )
2012-08-02 23:42:03 +02:00
goto new_segment ;
2013-11-23 17:19:00 -08:00
if ( ! BIOVEC_SEG_BOUNDARY ( q , bvprv , bvec ) )
2012-08-02 23:42:03 +02:00
goto new_segment ;
( * sg ) - > length + = nbytes ;
} else {
new_segment :
if ( ! * sg )
* sg = sglist ;
else {
/*
* If the driver previously mapped a shorter
* list , we could see a termination bit
* prematurely unless it fully inits the sg
* table on each mapping . We KNOW that there
* must be more entries here or the driver
* would be buggy , so force clear the
* termination bit to avoid doing a full
* sg_init_table ( ) in drivers for each command .
*/
2013-03-20 15:37:08 +10:30
sg_unmark_end ( * sg ) ;
2012-08-02 23:42:03 +02:00
* sg = sg_next ( * sg ) ;
}
sg_set_page ( * sg , bvec - > bv_page , nbytes , bvec - > bv_offset ) ;
( * nsegs ) + + ;
}
2013-11-23 17:19:00 -08:00
* bvprv = * bvec ;
2012-08-02 23:42:03 +02:00
}
2016-12-08 15:20:32 -07:00
static inline int __blk_bvec_map_sg ( struct request_queue * q , struct bio_vec bv ,
struct scatterlist * sglist , struct scatterlist * * sg )
{
* sg = sglist ;
sg_set_page ( * sg , bv . bv_page , bv . bv_len , bv . bv_offset ) ;
return 1 ;
}
2014-02-07 13:53:46 -07:00
static int __blk_bios_map_sg ( struct request_queue * q , struct bio * bio ,
struct scatterlist * sglist ,
struct scatterlist * * sg )
2008-01-29 14:04:06 +01:00
{
2013-12-03 14:29:09 -07:00
struct bio_vec bvec , bvprv = { NULL } ;
2014-02-07 13:53:46 -07:00
struct bvec_iter iter ;
2016-12-08 15:20:32 -07:00
int cluster = blk_queue_cluster ( q ) , nsegs = 0 ;
2014-02-07 13:53:46 -07:00
for_each_bio ( bio )
bio_for_each_segment ( bvec , bio , iter )
__blk_segment_map_sg ( q , & bvec , sglist , & bvprv , sg ,
& nsegs , & cluster ) ;
2008-01-29 14:04:06 +01:00
2014-02-07 13:53:46 -07:00
return nsegs ;
}
/*
* map a request to scatterlist , return number of sg entries setup . Caller
* must make sure sg can hold rq - > nr_phys_segments entries
*/
int blk_rq_map_sg ( struct request_queue * q , struct request * rq ,
struct scatterlist * sglist )
{
struct scatterlist * sg = NULL ;
int nsegs = 0 ;
2016-12-08 15:20:32 -07:00
if ( rq - > rq_flags & RQF_SPECIAL_PAYLOAD )
nsegs = __blk_bvec_map_sg ( q , rq - > special_vec , sglist , & sg ) ;
else if ( rq - > bio & & bio_op ( rq - > bio ) = = REQ_OP_WRITE_SAME )
nsegs = __blk_bvec_map_sg ( q , bio_iovec ( rq - > bio ) , sglist , & sg ) ;
else if ( rq - > bio )
2014-02-07 13:53:46 -07:00
nsegs = __blk_bios_map_sg ( q , rq - > bio , sglist , & sg ) ;
2008-04-11 12:56:52 +02:00
2016-10-20 15:12:13 +02:00
if ( unlikely ( rq - > rq_flags & RQF_COPY_USER ) & &
2009-05-07 22:24:41 +09:00
( blk_rq_bytes ( rq ) & q - > dma_pad_mask ) ) {
unsigned int pad_len =
( q - > dma_pad_mask & ~ blk_rq_bytes ( rq ) ) + 1 ;
2008-04-11 12:56:52 +02:00
sg - > length + = pad_len ;
rq - > extra_len + = pad_len ;
}
2008-02-19 11:36:53 +01:00
if ( q - > dma_drain_size & & q - > dma_drain_needed ( rq ) ) {
2016-06-05 14:31:45 -05:00
if ( op_is_write ( req_op ( rq ) ) )
2008-02-19 11:36:55 +01:00
memset ( q - > dma_drain_buffer , 0 , q - > dma_drain_size ) ;
2015-08-07 18:15:14 +02:00
sg_unmark_end ( sg ) ;
2008-01-29 14:04:06 +01:00
sg = sg_next ( sg ) ;
sg_set_page ( sg , virt_to_page ( q - > dma_drain_buffer ) ,
q - > dma_drain_size ,
( ( unsigned long ) q - > dma_drain_buffer ) &
( PAGE_SIZE - 1 ) ) ;
nsegs + + ;
2008-03-04 11:17:11 +01:00
rq - > extra_len + = q - > dma_drain_size ;
2008-01-29 14:04:06 +01:00
}
if ( sg )
sg_mark_end ( sg ) ;
2015-11-24 10:35:31 +08:00
/*
* Something must have been wrong if the figured number of
* segment is bigger than number of req ' s physical segments
*/
2016-12-08 15:20:32 -07:00
WARN_ON ( nsegs > blk_rq_nr_phys_segments ( rq ) ) ;
2015-11-24 10:35:31 +08:00
2008-01-29 14:04:06 +01:00
return nsegs ;
}
EXPORT_SYMBOL ( blk_rq_map_sg ) ;
static inline int ll_new_hw_segment ( struct request_queue * q ,
struct request * req ,
struct bio * bio )
{
int nr_phys_segs = bio_phys_segments ( q , bio ) ;
2010-09-10 20:50:10 +02:00
if ( req - > nr_phys_segments + nr_phys_segs > queue_max_segments ( q ) )
goto no_merge ;
2014-09-26 19:20:06 -04:00
if ( blk_integrity_merge_bio ( q , req , bio ) = = false )
2010-09-10 20:50:10 +02:00
goto no_merge ;
2008-01-29 14:04:06 +01:00
/*
* This will form the start of a new hw segment . Bump both
* counters .
*/
req - > nr_phys_segments + = nr_phys_segs ;
return 1 ;
2010-09-10 20:50:10 +02:00
no_merge :
2016-12-01 08:36:16 -07:00
req_set_nomerge ( q , req ) ;
2010-09-10 20:50:10 +02:00
return 0 ;
2008-01-29 14:04:06 +01:00
}
int ll_back_merge_fn ( struct request_queue * q , struct request * req ,
struct bio * bio )
{
2015-09-03 19:28:20 +03:00
if ( req_gap_back_merge ( req , bio ) )
return 0 ;
2015-09-11 09:03:04 -06:00
if ( blk_integrity_rq ( req ) & &
integrity_req_gap_back_merge ( req , bio ) )
return 0 ;
2012-09-18 12:19:26 -04:00
if ( blk_rq_sectors ( req ) + bio_sectors ( bio ) >
2016-07-20 21:40:47 -06:00
blk_rq_get_max_sectors ( req , blk_rq_pos ( req ) ) ) {
2016-12-01 08:36:16 -07:00
req_set_nomerge ( q , req ) ;
2008-01-29 14:04:06 +01:00
return 0 ;
}
2008-05-07 09:33:55 +02:00
if ( ! bio_flagged ( req - > biotail , BIO_SEG_VALID ) )
2008-01-29 14:04:06 +01:00
blk_recount_segments ( q , req - > biotail ) ;
2008-05-07 09:33:55 +02:00
if ( ! bio_flagged ( bio , BIO_SEG_VALID ) )
2008-01-29 14:04:06 +01:00
blk_recount_segments ( q , bio ) ;
return ll_new_hw_segment ( q , req , bio ) ;
}
2008-01-31 13:03:55 +01:00
int ll_front_merge_fn ( struct request_queue * q , struct request * req ,
2008-01-29 14:04:06 +01:00
struct bio * bio )
{
2015-09-03 19:28:20 +03:00
if ( req_gap_front_merge ( req , bio ) )
return 0 ;
2015-09-11 09:03:04 -06:00
if ( blk_integrity_rq ( req ) & &
integrity_req_gap_front_merge ( req , bio ) )
return 0 ;
2012-09-18 12:19:26 -04:00
if ( blk_rq_sectors ( req ) + bio_sectors ( bio ) >
2016-07-20 21:40:47 -06:00
blk_rq_get_max_sectors ( req , bio - > bi_iter . bi_sector ) ) {
2016-12-01 08:36:16 -07:00
req_set_nomerge ( q , req ) ;
2008-01-29 14:04:06 +01:00
return 0 ;
}
2008-05-07 09:33:55 +02:00
if ( ! bio_flagged ( bio , BIO_SEG_VALID ) )
2008-01-29 14:04:06 +01:00
blk_recount_segments ( q , bio ) ;
2008-05-07 09:33:55 +02:00
if ( ! bio_flagged ( req - > bio , BIO_SEG_VALID ) )
2008-01-29 14:04:06 +01:00
blk_recount_segments ( q , req - > bio ) ;
return ll_new_hw_segment ( q , req , bio ) ;
}
2013-10-29 12:11:47 -06:00
/*
* blk - mq uses req - > special to carry normal driver per - request payload , it
* does not indicate a prepared command that we cannot merge with .
*/
static bool req_no_special_merge ( struct request * req )
{
struct request_queue * q = req - > q ;
return ! q - > mq_ops & & req - > special ;
}
2008-01-29 14:04:06 +01:00
static int ll_merge_requests_fn ( struct request_queue * q , struct request * req ,
struct request * next )
{
int total_phys_segments ;
2008-10-13 14:19:05 +02:00
unsigned int seg_size =
req - > biotail - > bi_seg_back_size + next - > bio - > bi_seg_front_size ;
2008-01-29 14:04:06 +01:00
/*
* First check if the either of the requests are re - queued
* requests . Can ' t merge them if they are .
*/
2013-10-29 12:11:47 -06:00
if ( req_no_special_merge ( req ) | | req_no_special_merge ( next ) )
2008-01-29 14:04:06 +01:00
return 0 ;
2015-09-03 19:28:20 +03:00
if ( req_gap_back_merge ( req , next - > bio ) )
2015-02-11 08:20:13 -07:00
return 0 ;
2008-01-29 14:04:06 +01:00
/*
* Will it become too large ?
*/
2012-09-18 12:19:26 -04:00
if ( ( blk_rq_sectors ( req ) + blk_rq_sectors ( next ) ) >
2016-07-20 21:40:47 -06:00
blk_rq_get_max_sectors ( req , blk_rq_pos ( req ) ) )
2008-01-29 14:04:06 +01:00
return 0 ;
total_phys_segments = req - > nr_phys_segments + next - > nr_phys_segments ;
2008-10-13 14:19:05 +02:00
if ( blk_phys_contig_segment ( q , req - > biotail , next - > bio ) ) {
if ( req - > nr_phys_segments = = 1 )
req - > bio - > bi_seg_front_size = seg_size ;
if ( next - > nr_phys_segments = = 1 )
next - > biotail - > bi_seg_back_size = seg_size ;
2008-01-29 14:04:06 +01:00
total_phys_segments - - ;
2008-10-13 14:19:05 +02:00
}
2008-01-29 14:04:06 +01:00
2010-02-26 00:20:39 -05:00
if ( total_phys_segments > queue_max_segments ( q ) )
2008-01-29 14:04:06 +01:00
return 0 ;
2014-09-26 19:20:06 -04:00
if ( blk_integrity_merge_rq ( q , req , next ) = = false )
2010-09-10 20:50:10 +02:00
return 0 ;
2008-01-29 14:04:06 +01:00
/* Merge is OK... */
req - > nr_phys_segments = total_phys_segments ;
return 1 ;
}
2009-07-03 17:48:17 +09:00
/**
* blk_rq_set_mixed_merge - mark a request as mixed merge
* @ rq : request to mark as mixed merge
*
* Description :
* @ rq is about to be mixed merged . Make sure the attributes
* which can be mixed are set in each bio and mark @ rq as mixed
* merged .
*/
void blk_rq_set_mixed_merge ( struct request * rq )
{
unsigned int ff = rq - > cmd_flags & REQ_FAILFAST_MASK ;
struct bio * bio ;
2016-10-20 15:12:13 +02:00
if ( rq - > rq_flags & RQF_MIXED_MERGE )
2009-07-03 17:48:17 +09:00
return ;
/*
* @ rq will no longer represent mixable attributes for all the
* contained bios . It will just track those of the first one .
* Distributes the attributs to each bio .
*/
for ( bio = rq - > bio ; bio ; bio = bio - > bi_next ) {
2016-08-05 15:35:16 -06:00
WARN_ON_ONCE ( ( bio - > bi_opf & REQ_FAILFAST_MASK ) & &
( bio - > bi_opf & REQ_FAILFAST_MASK ) ! = ff ) ;
bio - > bi_opf | = ff ;
2009-07-03 17:48:17 +09:00
}
2016-10-20 15:12:13 +02:00
rq - > rq_flags | = RQF_MIXED_MERGE ;
2009-07-03 17:48:17 +09:00
}
2009-03-27 10:31:51 +01:00
static void blk_account_io_merge ( struct request * req )
{
if ( blk_do_io_stat ( req ) ) {
struct hd_struct * part ;
int cpu ;
cpu = part_stat_lock ( ) ;
2011-01-05 16:57:38 +01:00
part = req - > part ;
2009-03-27 10:31:51 +01:00
part_round_stats ( cpu , part ) ;
block: Seperate read and write statistics of in_flight requests v2
Commit a9327cac440be4d8333bba975cbbf76045096275 added seperate read
and write statistics of in_flight requests. And exported the number
of read and write requests in progress seperately through sysfs.
But Corrado Zoccolo <czoccolo@gmail.com> reported getting strange
output from "iostat -kx 2". Global values for service time and
utilization were garbage. For interval values, utilization was always
100%, and service time is higher than normal.
So this was reverted by commit 0f78ab9899e9d6acb09d5465def618704255963b
The problem was in part_round_stats_single(), I missed the following:
if (now == part->stamp)
return;
- if (part->in_flight) {
+ if (part_in_flight(part)) {
__part_stat_add(cpu, part, time_in_queue,
part_in_flight(part) * (now - part->stamp));
__part_stat_add(cpu, part, io_ticks, (now - part->stamp));
With this chunk included, the reported regression gets fixed.
Signed-off-by: Nikanth Karthikesan <knikanth@suse.de>
--
Signed-off-by: Jens Axboe <jens.axboe@oracle.com>
2009-10-06 20:16:55 +02:00
part_dec_in_flight ( part , rq_data_dir ( req ) ) ;
2009-03-27 10:31:51 +01:00
2011-01-07 08:43:37 +01:00
hd_struct_put ( part ) ;
2009-03-27 10:31:51 +01:00
part_stat_unlock ( ) ;
}
}
2008-01-29 14:04:06 +01:00
/*
2017-02-02 08:54:40 -07:00
* For non - mq , this has to be called with the request spinlock acquired .
* For mq with scheduling , the appropriate queue wide lock should be held .
2008-01-29 14:04:06 +01:00
*/
2017-02-02 08:54:40 -07:00
static struct request * attempt_merge ( struct request_queue * q ,
struct request * req , struct request * next )
2008-01-29 14:04:06 +01:00
{
if ( ! rq_mergeable ( req ) | | ! rq_mergeable ( next ) )
2017-02-02 08:54:40 -07:00
return NULL ;
2008-01-29 14:04:06 +01:00
2016-06-09 16:00:36 +02:00
if ( req_op ( req ) ! = req_op ( next ) )
2017-02-02 08:54:40 -07:00
return NULL ;
2012-09-18 12:19:26 -04:00
2008-01-29 14:04:06 +01:00
/*
* not contiguous
*/
2009-05-07 22:24:39 +09:00
if ( blk_rq_pos ( req ) + blk_rq_sectors ( req ) ! = blk_rq_pos ( next ) )
2017-02-02 08:54:40 -07:00
return NULL ;
2008-01-29 14:04:06 +01:00
if ( rq_data_dir ( req ) ! = rq_data_dir ( next )
| | req - > rq_disk ! = next - > rq_disk
2013-10-29 12:11:47 -06:00
| | req_no_special_merge ( next ) )
2017-02-02 08:54:40 -07:00
return NULL ;
2008-01-29 14:04:06 +01:00
2016-06-05 14:32:15 -05:00
if ( req_op ( req ) = = REQ_OP_WRITE_SAME & &
2012-09-18 12:19:27 -04:00
! blk_write_same_mergeable ( req - > bio , next - > bio ) )
2017-02-02 08:54:40 -07:00
return NULL ;
2012-09-18 12:19:27 -04:00
2008-01-29 14:04:06 +01:00
/*
* If we are allowed to merge , then append bio list
* from next to rq and release next . merge_requests_fn
* will have updated segment counts , update sector
* counts here .
*/
if ( ! ll_merge_requests_fn ( q , req , next ) )
2017-02-02 08:54:40 -07:00
return NULL ;
2008-01-29 14:04:06 +01:00
2009-07-03 17:48:17 +09:00
/*
* If failfast settings disagree or any of the two is already
* a mixed merge , mark both as mixed before proceeding . This
* makes sure that all involved bios have mixable attributes
* set properly .
*/
2016-10-20 15:12:13 +02:00
if ( ( ( req - > rq_flags | next - > rq_flags ) & RQF_MIXED_MERGE ) | |
2009-07-03 17:48:17 +09:00
( req - > cmd_flags & REQ_FAILFAST_MASK ) ! =
( next - > cmd_flags & REQ_FAILFAST_MASK ) ) {
blk_rq_set_mixed_merge ( req ) ;
blk_rq_set_mixed_merge ( next ) ;
}
2008-01-29 14:04:06 +01:00
/*
* At this point we have either done a back merge
* or front merge . We need the smaller start_time of
* the merged requests to be the current request
* for accounting purposes .
*/
if ( time_after ( req - > start_time , next - > start_time ) )
req - > start_time = next - > start_time ;
req - > biotail - > bi_next = next - > bio ;
req - > biotail = next - > biotail ;
2009-05-07 22:24:44 +09:00
req - > __data_len + = blk_rq_bytes ( next ) ;
2008-01-29 14:04:06 +01:00
elv_merge_requests ( q , req , next ) ;
2009-04-22 14:01:49 +02:00
/*
* ' next ' is going away , so update stats accordingly
*/
blk_account_io_merge ( next ) ;
2008-01-29 14:04:06 +01:00
req - > ioprio = ioprio_best ( req - > ioprio , next - > ioprio ) ;
2008-08-26 10:25:02 +02:00
if ( blk_rq_cpu_valid ( next ) )
req - > cpu = next - > cpu ;
2008-01-29 14:04:06 +01:00
2017-02-03 09:48:28 -07:00
/*
* ownership of bio passed from next to req , return ' next ' for
* the caller to free
*/
2009-03-24 12:35:07 +01:00
next - > bio = NULL ;
2017-02-02 08:54:40 -07:00
return next ;
2008-01-29 14:04:06 +01:00
}
2017-02-02 08:54:40 -07:00
struct request * attempt_back_merge ( struct request_queue * q , struct request * rq )
2008-01-29 14:04:06 +01:00
{
struct request * next = elv_latter_request ( q , rq ) ;
if ( next )
return attempt_merge ( q , rq , next ) ;
2017-02-02 08:54:40 -07:00
return NULL ;
2008-01-29 14:04:06 +01:00
}
2017-02-02 08:54:40 -07:00
struct request * attempt_front_merge ( struct request_queue * q , struct request * rq )
2008-01-29 14:04:06 +01:00
{
struct request * prev = elv_former_request ( q , rq ) ;
if ( prev )
return attempt_merge ( q , prev , rq ) ;
2017-02-02 08:54:40 -07:00
return NULL ;
2008-01-29 14:04:06 +01:00
}
2011-03-21 10:14:27 +01:00
int blk_attempt_req_merge ( struct request_queue * q , struct request * rq ,
struct request * next )
{
2016-07-07 11:48:22 -07:00
struct elevator_queue * e = q - > elevator ;
2017-02-03 09:48:28 -07:00
struct request * free ;
2016-07-07 11:48:22 -07:00
2017-01-17 06:03:22 -07:00
if ( ! e - > uses_mq & & e - > type - > ops . sq . elevator_allow_rq_merge_fn )
2016-12-10 15:13:59 -07:00
if ( ! e - > type - > ops . sq . elevator_allow_rq_merge_fn ( q , rq , next ) )
2016-07-07 11:48:22 -07:00
return 0 ;
2017-02-03 09:48:28 -07:00
free = attempt_merge ( q , rq , next ) ;
if ( free ) {
__blk_put_request ( q , free ) ;
return 1 ;
}
return 0 ;
2011-03-21 10:14:27 +01:00
}
2012-02-08 09:19:38 +01:00
bool blk_rq_merge_ok ( struct request * rq , struct bio * bio )
{
2012-09-18 12:19:25 -04:00
if ( ! rq_mergeable ( rq ) | | ! bio_mergeable ( bio ) )
2012-02-08 09:19:38 +01:00
return false ;
2016-06-09 16:00:36 +02:00
if ( req_op ( rq ) ! = bio_op ( bio ) )
2012-09-18 12:19:26 -04:00
return false ;
2012-02-08 09:19:38 +01:00
/* different data direction or already started, don't merge */
if ( bio_data_dir ( bio ) ! = rq_data_dir ( rq ) )
return false ;
/* must be same device and not a special request */
2013-10-29 12:11:47 -06:00
if ( rq - > rq_disk ! = bio - > bi_bdev - > bd_disk | | req_no_special_merge ( rq ) )
2012-02-08 09:19:38 +01:00
return false ;
/* only merge integrity protected bio into ditto rq */
2014-09-26 19:20:06 -04:00
if ( blk_integrity_merge_bio ( rq - > q , rq , bio ) = = false )
2012-02-08 09:19:38 +01:00
return false ;
2012-09-18 12:19:27 -04:00
/* must be using the same buffer */
2016-06-05 14:32:15 -05:00
if ( req_op ( rq ) = = REQ_OP_WRITE_SAME & &
2012-09-18 12:19:27 -04:00
! blk_write_same_mergeable ( rq - > bio , bio ) )
return false ;
2012-02-08 09:19:38 +01:00
return true ;
}
2017-02-08 14:46:48 +01:00
enum elv_merge blk_try_merge ( struct request * rq , struct bio * bio )
2012-02-08 09:19:38 +01:00
{
2017-02-08 14:46:49 +01:00
if ( req_op ( rq ) = = REQ_OP_DISCARD & &
queue_max_discard_segments ( rq - > q ) > 1 )
return ELEVATOR_DISCARD_MERGE ;
else if ( blk_rq_pos ( rq ) + blk_rq_sectors ( rq ) = = bio - > bi_iter . bi_sector )
2012-02-08 09:19:38 +01:00
return ELEVATOR_BACK_MERGE ;
2013-10-11 15:44:27 -07:00
else if ( blk_rq_pos ( rq ) - bio_sectors ( bio ) = = bio - > bi_iter . bi_sector )
2012-02-08 09:19:38 +01:00
return ELEVATOR_FRONT_MERGE ;
return ELEVATOR_NO_MERGE ;
}