2019-05-19 15:08:55 +03:00
// SPDX-License-Identifier: GPL-2.0-only
2005-04-17 02:20:36 +04:00
/*
2014-01-17 15:06:53 +04:00
* Copyright ( C ) 1999 Eric Youngdale
* Copyright ( C ) 2014 Christoph Hellwig
2005-04-17 02:20:36 +04:00
*
* SCSI queueing library .
* Initial versions : Eric Youngdale ( eric @ andante . org ) .
* Based upon conversations with large numbers
* of people at Linux Expo .
*/
# include <linux/bio.h>
2008-01-15 20:11:46 +03:00
# include <linux/bitops.h>
2005-04-17 02:20:36 +04:00
# include <linux/blkdev.h>
# include <linux/completion.h>
# include <linux/kernel.h>
2011-05-27 17:37:25 +04:00
# include <linux/export.h>
2005-04-17 02:20:36 +04:00
# include <linux/init.h>
# include <linux/pci.h>
# include <linux/delay.h>
2006-02-14 19:42:07 +03:00
# include <linux/hardirq.h>
2007-10-16 13:08:49 +04:00
# include <linux/scatterlist.h>
2014-01-17 15:06:53 +04:00
# include <linux/blk-mq.h>
2021-09-20 15:33:27 +03:00
# include <linux/blk-integrity.h>
2014-10-24 16:27:07 +04:00
# include <linux/ratelimit.h>
2015-12-01 12:16:57 +03:00
# include <asm/unaligned.h>
2005-04-17 02:20:36 +04:00
# include <scsi/scsi.h>
2006-06-10 20:01:03 +04:00
# include <scsi/scsi_cmnd.h>
2005-04-17 02:20:36 +04:00
# include <scsi/scsi_dbg.h>
# include <scsi/scsi_device.h>
# include <scsi/scsi_driver.h>
# include <scsi/scsi_eh.h>
# include <scsi/scsi_host.h>
2017-05-02 20:45:03 +03:00
# include <scsi/scsi_transport.h> /* __scsi_init_queue() */
2015-08-27 15:16:59 +03:00
# include <scsi/scsi_dh.h>
2005-04-17 02:20:36 +04:00
2014-05-06 14:25:40 +04:00
# include <trace/events/scsi.h>
2017-04-26 23:47:57 +03:00
# include "scsi_debugfs.h"
2005-04-17 02:20:36 +04:00
# include "scsi_priv.h"
# include "scsi_logging.h"
2019-04-28 10:39:31 +03:00
/*
* Size of integrity metadata is usually small , 1 inline sg should
* cover normal cases .
*/
2019-06-06 11:34:09 +03:00
# ifdef CONFIG_ARCH_NO_SG_CHAIN
# define SCSI_INLINE_PROT_SG_CNT 0
# define SCSI_INLINE_SG_CNT 0
# else
2019-04-28 10:39:31 +03:00
# define SCSI_INLINE_PROT_SG_CNT 1
2019-04-28 10:39:32 +03:00
# define SCSI_INLINE_SG_CNT 2
2019-06-06 11:34:09 +03:00
# endif
2019-04-28 10:39:32 +03:00
2017-01-03 08:28:41 +03:00
static struct kmem_cache * scsi_sense_cache ;
static DEFINE_MUTEX ( scsi_sense_cache_mutex ) ;
2005-04-17 02:20:36 +04:00
2017-08-31 02:58:42 +03:00
static void scsi_mq_uninit_cmd ( struct scsi_cmnd * cmd ) ;
2017-01-03 08:28:41 +03:00
int scsi_init_sense_cache ( struct Scsi_Host * shost )
{
int ret = 0 ;
2019-07-12 05:08:19 +03:00
mutex_lock ( & scsi_sense_cache_mutex ) ;
2021-03-31 10:29:58 +03:00
if ( ! scsi_sense_cache ) {
2017-01-03 08:28:41 +03:00
scsi_sense_cache =
2017-06-11 05:50:45 +03:00
kmem_cache_create_usercopy ( " scsi_sense_cache " ,
SCSI_SENSE_BUFFERSIZE , 0 , SLAB_HWCACHE_ALIGN ,
0 , SCSI_SENSE_BUFFERSIZE , NULL ) ;
2017-01-03 08:28:41 +03:00
if ( ! scsi_sense_cache )
ret = - ENOMEM ;
}
mutex_unlock ( & scsi_sense_cache_mutex ) ;
return ret ;
}
2007-12-13 14:50:53 +03:00
2010-04-16 23:13:15 +04:00
/*
* When to reinvoke queueing after a resource shortage . It ' s 3 msecs to
* not change behaviour from the previous unplug mechanism , experimentation
* may prove this needs changing .
*/
# define SCSI_QUEUE_DELAY 3
2014-01-23 16:55:38 +04:00
static void
scsi_set_blocked ( struct scsi_cmnd * cmd , int reason )
2005-04-17 02:20:36 +04:00
{
struct Scsi_Host * host = cmd - > device - > host ;
struct scsi_device * device = cmd - > device ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
struct scsi_target * starget = scsi_target ( device ) ;
2005-04-17 02:20:36 +04:00
/*
2005-05-13 19:46:08 +04:00
* Set the appropriate busy bit for the device / host .
2005-04-17 02:20:36 +04:00
*
* If the host / device isn ' t busy , assume that something actually
* completed , and that we should be able to queue a command now .
*
* Note that the prior mid - layer assumption that any host could
* always queue at least one command is now broken . The mid - layer
* will implement a user specifiable stall ( see
* scsi_host . max_host_blocked and scsi_device . max_device_blocked )
* if a command is requeued with no other commands outstanding
* either for the device or for the host .
*/
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
switch ( reason ) {
case SCSI_MLQUEUE_HOST_BUSY :
2014-01-23 15:07:41 +04:00
atomic_set ( & host - > host_blocked , host - > max_host_blocked ) ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
break ;
case SCSI_MLQUEUE_DEVICE_BUSY :
[SCSI] scsi_lib: pause between error retries
During cable pull tests on our 16G FC adapter, we are seeing errors,
typically reads to close targets, which fail due to CRC or framing
errors caused by the cable being pull (return status DID_ERROR).
The adapter detects the error on one of the first frames received,
marks the FC exchange as dead (further frames go to bit bucket) and
signals the host of the error. This action is so quick, and coupled
with fast host CPUs, creates a scenario in which the midlayer sees
the failure and retries the io almost immediately. We've seen link
traces with the retry on the link while the original i/o is still
being processed by the target. We're also seeing the time window
for the "link to pull-apart" and the physical interface to report
disconnected to be in the few millisecond range. Which means, we're
encountering scenarios where the full retry count is exhausted
(all with error) by the midlayer before the link disconnect state
is detected.
We looked at 8G FC behavior and occasionally see the same behavior,
but as the link was slower, it rarely could exhaust all retries
before the link reported disconnect.
What is needed is a slight delay between io retries due to DID_ERROR
to cover this error. It is inappropriate to put this delay in the
driver, as the error is indistinguishable from other link-related errors,
nor does the driver track whether the io is a retry or not. This is also
easier than tracking between-io-error bursts that are seen in this
scenario.
The patch below updates the retry path so that it inserts a delay as
if the target was busy. The busy delay is on the order of 6ms. This
delay is sufficient to ensure the link down condition is reported
before the retry count is exhausted (at most 1 retry is seen).
Signed-off-by: Alex Iannicelli <alex.iannicelli@emulex.com>
Signed-off-by: James Smart <james.smart@emulex.com>
Signed-off-by: James Bottomley <JBottomley@Parallels.com>
2011-07-06 20:45:17 +04:00
case SCSI_MLQUEUE_EH_RETRY :
2014-01-23 15:07:41 +04:00
atomic_set ( & device - > device_blocked ,
device - > max_device_blocked ) ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
break ;
case SCSI_MLQUEUE_TARGET_BUSY :
2014-01-23 15:07:41 +04:00
atomic_set ( & starget - > target_blocked ,
starget - > max_target_blocked ) ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
break ;
}
2014-01-23 16:55:38 +04:00
}
2014-01-17 15:06:53 +04:00
static void scsi_mq_requeue_cmd ( struct scsi_cmnd * cmd )
{
2021-08-10 02:03:05 +03:00
struct request * rq = scsi_cmd_to_rq ( cmd ) ;
if ( rq - > rq_flags & RQF_DONTPREP ) {
rq - > rq_flags & = ~ RQF_DONTPREP ;
2017-08-31 02:58:42 +03:00
scsi_mq_uninit_cmd ( cmd ) ;
} else {
WARN_ON_ONCE ( true ) ;
}
2021-08-10 02:03:05 +03:00
blk_mq_requeue_request ( rq , true ) ;
2014-01-17 15:06:53 +04:00
}
2014-01-23 16:55:38 +04:00
/**
* __scsi_queue_insert - private queue insertion
* @ cmd : The SCSI command being requeued
* @ reason : The reason for the requeue
* @ unbusy : Whether the queue should be unbusied
*
* This is a private queue insertion . The public interface
* scsi_queue_insert ( ) always assumes the queue should be unbusied
* because it ' s always called before the completion . This function is
* for a requeue after completion , which should only occur in this
* file .
*/
2018-01-11 01:41:45 +03:00
static void __scsi_queue_insert ( struct scsi_cmnd * cmd , int reason , bool unbusy )
2014-01-23 16:55:38 +04:00
{
struct scsi_device * device = cmd - > device ;
SCSI_LOG_MLQUEUE ( 1 , scmd_printk ( KERN_INFO , cmd ,
" Inserting command %p into mlqueue \n " , cmd ) ) ;
scsi_set_blocked ( cmd , reason ) ;
2005-04-17 02:20:36 +04:00
/*
* Decrement the counters , since these commands are no longer
* active on the host / device .
*/
2009-01-02 19:42:21 +03:00
if ( unbusy )
2019-10-25 09:58:55 +03:00
scsi_device_unbusy ( device , cmd ) ;
2005-04-17 02:20:36 +04:00
/*
2005-04-24 11:08:52 +04:00
* Requeue this command . It will go before all other commands
2012-06-29 19:36:07 +04:00
* that are already in the queue . Schedule requeue work under
* lock such that the kblockd_schedule_work ( ) call happens
* before blk_cleanup_queue ( ) finishes .
2010-04-16 23:13:15 +04:00
*/
2014-03-28 21:51:15 +04:00
cmd - > result = 0 ;
2018-11-02 01:36:27 +03:00
2021-08-10 02:03:05 +03:00
blk_mq_requeue_request ( scsi_cmd_to_rq ( cmd ) , true ) ;
2005-04-17 02:20:36 +04:00
}
2020-04-19 08:01:48 +03:00
/**
* scsi_queue_insert - Reinsert a command in the queue .
* @ cmd : command that we are adding to queue .
* @ reason : why we are inserting command to queue .
2009-01-02 19:42:21 +03:00
*
2020-04-19 08:01:48 +03:00
* We do this for one of two cases . Either the host is busy and it cannot accept
* any more commands for the time being , or the device returned QUEUE_FULL and
* can accept no more commands .
2009-01-02 19:42:21 +03:00
*
2020-04-19 08:01:48 +03:00
* Context : This could be called either from an interrupt context or a normal
* process context .
2009-01-02 19:42:21 +03:00
*/
2012-06-29 19:35:05 +04:00
void scsi_queue_insert ( struct scsi_cmnd * cmd , int reason )
2009-01-02 19:42:21 +03:00
{
2018-01-11 01:41:45 +03:00
__scsi_queue_insert ( cmd , reason , true ) ;
2009-01-02 19:42:21 +03:00
}
2016-10-20 16:12:13 +03:00
2017-02-23 18:02:36 +03:00
/**
2018-07-31 22:51:54 +03:00
* __scsi_execute - insert request and wait for the result
2017-02-23 18:02:36 +03:00
* @ sdev : scsi device
* @ cmd : scsi command
* @ data_direction : data direction
* @ buffer : data buffer
* @ bufflen : len of buffer
* @ sense : optional sense buffer
* @ sshdr : optional decoded sense header
2021-07-09 23:26:20 +03:00
* @ timeout : request timeout in HZ
2017-02-23 18:02:36 +03:00
* @ retries : number of times to retry request
* @ flags : flags for - > cmd_flags
* @ rq_flags : flags for - > rq_flags
* @ resid : optional residual length
*
2017-04-20 17:03:01 +03:00
* Returns the scsi_cmnd result field if a command was executed , or a negative
* Linux error code if we didn ' t get that far .
2017-02-23 18:02:36 +03:00
*/
2018-07-31 22:51:54 +03:00
int __scsi_execute ( struct scsi_device * sdev , const unsigned char * cmd ,
2005-08-28 20:31:14 +04:00
int data_direction , void * buffer , unsigned bufflen ,
2017-02-14 22:15:58 +03:00
unsigned char * sense , struct scsi_sense_hdr * sshdr ,
int timeout , int retries , u64 flags , req_flags_t rq_flags ,
int * resid )
2005-06-16 03:48:29 +04:00
{
struct request * req ;
2017-01-27 11:46:29 +03:00
struct scsi_request * rq ;
2021-04-27 11:30:12 +03:00
int ret ;
2005-06-16 03:48:29 +04:00
2021-10-21 09:06:05 +03:00
req = scsi_alloc_request ( sdev - > request_queue ,
2017-01-31 18:57:31 +03:00
data_direction = = DMA_TO_DEVICE ?
2021-06-24 15:39:34 +03:00
REQ_OP_DRV_OUT : REQ_OP_DRV_IN ,
2020-12-09 08:29:49 +03:00
rq_flags & RQF_PM ? BLK_MQ_REQ_PM : 0 ) ;
2014-08-28 18:15:21 +04:00
if ( IS_ERR ( req ) )
2021-04-27 11:30:12 +03:00
return PTR_ERR ( req ) ;
2005-06-16 03:48:29 +04:00
2021-04-27 11:30:12 +03:00
rq = scsi_req ( req ) ;
2005-06-16 03:48:29 +04:00
2021-04-27 11:30:12 +03:00
if ( bufflen ) {
ret = blk_rq_map_kern ( sdev - > request_queue , req ,
buffer , bufflen , GFP_NOIO ) ;
if ( ret )
goto out ;
}
2017-01-27 11:46:29 +03:00
rq - > cmd_len = COMMAND_SIZE ( cmd [ 0 ] ) ;
memcpy ( rq - > cmd , cmd , rq - > cmd_len ) ;
2017-04-05 20:18:12 +03:00
rq - > retries = retries ;
2005-06-16 03:48:29 +04:00
req - > timeout = timeout ;
2016-10-20 16:12:13 +03:00
req - > cmd_flags | = flags ;
2017-11-09 21:49:56 +03:00
req - > rq_flags | = rq_flags | RQF_QUIET ;
2005-06-16 03:48:29 +04:00
/*
* head injection * required * here otherwise quiesce won ' t work
*/
2021-11-26 15:18:01 +03:00
blk_execute_rq ( req , true ) ;
2005-06-16 03:48:29 +04:00
2008-06-24 22:03:14 +04:00
/*
* Some devices ( USB mass - storage in particular ) may transfer
* garbage data together with a residue indicating that the data
* is invalid . Prevent the garbage from being misinterpreted
* and prevent security leaks by zeroing out the excess data .
*/
2017-01-27 11:46:29 +03:00
if ( unlikely ( rq - > resid_len > 0 & & rq - > resid_len < = bufflen ) )
memset ( buffer + ( bufflen - rq - > resid_len ) , 0 , rq - > resid_len ) ;
2008-06-24 22:03:14 +04:00
2008-12-04 08:24:39 +03:00
if ( resid )
2017-01-27 11:46:29 +03:00
* resid = rq - > resid_len ;
if ( sense & & rq - > sense_len )
memcpy ( sense , rq - > sense , SCSI_SENSE_BUFFERSIZE ) ;
2017-02-14 22:15:58 +03:00
if ( sshdr )
scsi_normalize_sense ( rq - > sense , rq - > sense_len , sshdr ) ;
2017-04-20 17:03:01 +03:00
ret = rq - > result ;
2005-06-16 03:48:29 +04:00
out :
2021-10-25 10:05:07 +03:00
blk_mq_free_request ( req ) ;
2005-06-16 03:48:29 +04:00
return ret ;
}
2018-07-31 22:51:54 +03:00
EXPORT_SYMBOL ( __scsi_execute ) ;
2005-06-16 03:48:29 +04:00
2017-12-04 21:06:23 +03:00
/*
2019-10-25 09:58:55 +03:00
* Wake up the error handler if necessary . Avoid as follows that the error
* handler is not woken up if host in - flight requests number = =
* shost - > host_failed : use call_rcu ( ) in scsi_eh_scmd_add ( ) in combination
* with an RCU read lock in this function to ensure that this function in
* its entirety either finishes before scsi_eh_scmd_add ( ) increases the
2017-12-04 21:06:23 +03:00
* host_failed counter or that it notices the shost state change made by
* scsi_eh_scmd_add ( ) .
*/
2019-10-25 09:58:55 +03:00
static void scsi_dec_host_busy ( struct Scsi_Host * shost , struct scsi_cmnd * cmd )
2005-04-17 02:20:36 +04:00
{
unsigned long flags ;
2017-12-04 21:06:23 +03:00
rcu_read_lock ( ) ;
2019-10-25 09:58:55 +03:00
__clear_bit ( SCMD_STATE_INFLIGHT , & cmd - > state ) ;
2017-12-04 21:06:23 +03:00
if ( unlikely ( scsi_host_in_recovery ( shost ) ) ) {
2014-01-22 18:29:29 +04:00
spin_lock_irqsave ( shost - > host_lock , flags ) ;
2017-12-04 21:06:23 +03:00
if ( shost - > host_failed | | shost - > host_eh_scheduled )
scsi_eh_wakeup ( shost ) ;
2014-01-22 18:29:29 +04:00
spin_unlock_irqrestore ( shost - > host_lock , flags ) ;
}
2017-12-04 21:06:23 +03:00
rcu_read_unlock ( ) ;
}
2019-10-25 09:58:55 +03:00
void scsi_device_unbusy ( struct scsi_device * sdev , struct scsi_cmnd * cmd )
2017-12-04 21:06:23 +03:00
{
struct Scsi_Host * shost = sdev - > host ;
struct scsi_target * starget = scsi_target ( sdev ) ;
2019-10-25 09:58:55 +03:00
scsi_dec_host_busy ( shost , cmd ) ;
2017-12-04 21:06:23 +03:00
if ( starget - > can_queue > 0 )
atomic_dec ( & starget - > target_busy ) ;
2014-01-22 18:29:29 +04:00
2021-01-22 05:33:17 +03:00
sbitmap_put ( & sdev - > budget_map , cmd - > budget_token ) ;
2021-01-22 05:33:12 +03:00
cmd - > budget_token = - 1 ;
2005-04-17 02:20:36 +04:00
}
2014-01-17 15:06:53 +04:00
static void scsi_kick_queue ( struct request_queue * q )
{
2018-11-02 01:36:27 +03:00
blk_mq_run_hw_queues ( q , false ) ;
2014-01-17 15:06:53 +04:00
}
2005-04-17 02:20:36 +04:00
/*
* Called for single_lun devices on IO completion . Clear starget_sdev_user ,
* and call blk_run_queue for all the scsi_devices on the target -
* including current_sdev first .
*
* Called with * no * scsi locks held .
*/
static void scsi_single_lun_run ( struct scsi_device * current_sdev )
{
struct Scsi_Host * shost = current_sdev - > host ;
struct scsi_device * sdev , * tmp ;
struct scsi_target * starget = scsi_target ( current_sdev ) ;
unsigned long flags ;
spin_lock_irqsave ( shost - > host_lock , flags ) ;
starget - > starget_sdev_user = NULL ;
spin_unlock_irqrestore ( shost - > host_lock , flags ) ;
/*
* Call blk_run_queue for all LUNs on the target , starting with
* current_sdev . We race with others ( to set starget_sdev_user ) ,
* but in most cases , we will be first . Ideally , each LU on the
* target would get some limited time or requests on the target .
*/
2014-01-17 15:06:53 +04:00
scsi_kick_queue ( current_sdev - > request_queue ) ;
2005-04-17 02:20:36 +04:00
spin_lock_irqsave ( shost - > host_lock , flags ) ;
if ( starget - > starget_sdev_user )
goto out ;
list_for_each_entry_safe ( sdev , tmp , & starget - > devices ,
same_target_siblings ) {
if ( sdev = = current_sdev )
continue ;
if ( scsi_device_get ( sdev ) )
continue ;
spin_unlock_irqrestore ( shost - > host_lock , flags ) ;
2014-01-17 15:06:53 +04:00
scsi_kick_queue ( sdev - > request_queue ) ;
2005-04-17 02:20:36 +04:00
spin_lock_irqsave ( shost - > host_lock , flags ) ;
2020-06-19 18:41:17 +03:00
2005-04-17 02:20:36 +04:00
scsi_device_put ( sdev ) ;
}
out :
spin_unlock_irqrestore ( shost - > host_lock , flags ) ;
}
2014-01-23 15:07:41 +04:00
static inline bool scsi_device_is_busy ( struct scsi_device * sdev )
2008-10-04 22:11:06 +04:00
{
2021-01-22 05:33:15 +03:00
if ( scsi_device_busy ( sdev ) > = sdev - > queue_depth )
2014-01-23 15:07:41 +04:00
return true ;
if ( atomic_read ( & sdev - > device_blocked ) > 0 )
return true ;
return false ;
2008-10-04 22:11:06 +04:00
}
2014-01-23 15:07:41 +04:00
static inline bool scsi_target_is_busy ( struct scsi_target * starget )
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
{
2014-03-26 13:35:00 +04:00
if ( starget - > can_queue > 0 ) {
if ( atomic_read ( & starget - > target_busy ) > = starget - > can_queue )
return true ;
if ( atomic_read ( & starget - > target_blocked ) > 0 )
return true ;
}
2014-01-23 15:07:41 +04:00
return false ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
}
2014-01-23 15:07:41 +04:00
static inline bool scsi_host_is_busy ( struct Scsi_Host * shost )
2008-10-04 22:11:06 +04:00
{
2014-01-23 15:07:41 +04:00
if ( atomic_read ( & shost - > host_blocked ) > 0 )
return true ;
if ( shost - > host_self_blocked )
return true ;
return false ;
2008-10-04 22:11:06 +04:00
}
2014-02-21 02:20:54 +04:00
static void scsi_starved_list_run ( struct Scsi_Host * shost )
2005-04-17 02:20:36 +04:00
{
2008-11-11 22:42:35 +03:00
LIST_HEAD ( starved_list ) ;
2014-02-21 02:20:54 +04:00
struct scsi_device * sdev ;
2005-04-17 02:20:36 +04:00
unsigned long flags ;
spin_lock_irqsave ( shost - > host_lock , flags ) ;
2008-11-11 22:42:35 +03:00
list_splice_init ( & shost - > starved_list , & starved_list ) ;
while ( ! list_empty ( & starved_list ) ) {
2013-07-02 17:05:26 +04:00
struct request_queue * slq ;
2005-04-17 02:20:36 +04:00
/*
* As long as shost is accepting commands and we have
* starved queues , call blk_run_queue . scsi_request_fn
* drops the queue_lock and can add us back to the
* starved_list .
*
* host_lock protects the starved_list and starved_entry .
* scsi_request_fn must get the host_lock before checking
* or modifying starved_list or starved_entry .
*/
2008-11-11 22:42:35 +03:00
if ( scsi_host_is_busy ( shost ) )
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
break ;
2008-11-11 22:42:35 +03:00
sdev = list_entry ( starved_list . next ,
struct scsi_device , starved_entry ) ;
list_del_init ( & sdev - > starved_entry ) ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
if ( scsi_target_is_busy ( scsi_target ( sdev ) ) ) {
list_move_tail ( & sdev - > starved_entry ,
& shost - > starved_list ) ;
continue ;
}
2013-07-02 17:05:26 +04:00
/*
* Once we drop the host lock , a racing scsi_remove_device ( )
* call may remove the sdev from the starved list and destroy
* it and the queue . Mitigate by taking a reference to the
* queue and never touching the sdev again after we drop the
* host lock . Note : if __scsi_remove_device ( ) invokes
* blk_cleanup_queue ( ) before the queue is run from this
* function then blk_run_queue ( ) will return immediately since
* blk_cleanup_queue ( ) marks the queue with QUEUE_FLAG_DYING .
*/
slq = sdev - > request_queue ;
if ( ! blk_get_queue ( slq ) )
continue ;
spin_unlock_irqrestore ( shost - > host_lock , flags ) ;
2014-01-17 15:06:53 +04:00
scsi_kick_queue ( slq ) ;
2013-07-02 17:05:26 +04:00
blk_put_queue ( slq ) ;
spin_lock_irqsave ( shost - > host_lock , flags ) ;
2005-04-17 02:20:36 +04:00
}
2008-11-11 22:42:35 +03:00
/* put any unprocessed entries back */
list_splice ( & starved_list , & shost - > starved_list ) ;
2005-04-17 02:20:36 +04:00
spin_unlock_irqrestore ( shost - > host_lock , flags ) ;
2014-02-21 02:20:54 +04:00
}
2020-04-19 08:01:48 +03:00
/**
* scsi_run_queue - Select a proper request queue to serve next .
* @ q : last request ' s queue
2014-02-21 02:20:54 +04:00
*
2020-04-19 08:01:48 +03:00
* The previous command was completely finished , start a new one if possible .
2014-02-21 02:20:54 +04:00
*/
static void scsi_run_queue ( struct request_queue * q )
{
struct scsi_device * sdev = q - > queuedata ;
if ( scsi_target ( sdev ) - > single_lun )
scsi_single_lun_run ( sdev ) ;
if ( ! list_empty ( & sdev - > host - > starved_list ) )
scsi_starved_list_run ( sdev - > host ) ;
2005-04-17 02:20:36 +04:00
2018-11-02 01:36:27 +03:00
blk_mq_run_hw_queues ( q , false ) ;
2005-04-17 02:20:36 +04:00
}
2011-05-17 13:04:44 +04:00
void scsi_requeue_run_queue ( struct work_struct * work )
{
struct scsi_device * sdev ;
struct request_queue * q ;
sdev = container_of ( work , struct scsi_device , requeue_work ) ;
q = sdev - > request_queue ;
scsi_run_queue ( q ) ;
}
2005-04-17 02:20:36 +04:00
void scsi_run_host_queues ( struct Scsi_Host * shost )
{
struct scsi_device * sdev ;
shost_for_each_device ( sdev , shost )
scsi_run_queue ( sdev - > request_queue ) ;
}
2014-01-17 15:06:53 +04:00
static void scsi_uninit_cmd ( struct scsi_cmnd * cmd )
{
2021-08-10 02:03:05 +03:00
if ( ! blk_rq_is_passthrough ( scsi_cmd_to_rq ( cmd ) ) ) {
2014-01-17 15:06:53 +04:00
struct scsi_driver * drv = scsi_cmd_to_driver ( cmd ) ;
if ( drv - > uninit_command )
drv - > uninit_command ( cmd ) ;
}
}
2020-10-05 11:41:28 +03:00
void scsi_free_sgtables ( struct scsi_cmnd * cmd )
2014-01-17 15:06:53 +04:00
{
if ( cmd - > sdb . table . nents )
2019-04-28 10:39:32 +03:00
sg_free_table_chained ( & cmd - > sdb . table ,
SCSI_INLINE_SG_CNT ) ;
2014-01-17 15:06:53 +04:00
if ( scsi_prot_sg_count ( cmd ) )
2019-04-28 10:39:31 +03:00
sg_free_table_chained ( & cmd - > prot_sdb - > table ,
SCSI_INLINE_PROT_SG_CNT ) ;
2014-01-17 15:06:53 +04:00
}
2020-10-05 11:41:28 +03:00
EXPORT_SYMBOL_GPL ( scsi_free_sgtables ) ;
2014-01-17 15:06:53 +04:00
static void scsi_mq_uninit_cmd ( struct scsi_cmnd * cmd )
{
2020-04-28 13:45:55 +03:00
scsi_free_sgtables ( cmd ) ;
2014-01-17 15:06:53 +04:00
scsi_uninit_cmd ( cmd ) ;
}
2020-07-20 05:54:35 +03:00
static void scsi_run_queue_async ( struct scsi_device * sdev )
{
if ( scsi_target ( sdev ) - > single_lun | |
2020-09-10 10:50:56 +03:00
! list_empty ( & sdev - > host - > starved_list ) ) {
2020-07-20 05:54:35 +03:00
kblockd_schedule_work ( & sdev - > requeue_work ) ;
2020-09-10 10:50:56 +03:00
} else {
/*
* smp_mb ( ) present in sbitmap_queue_clear ( ) or implied in
* . end_io is for ordering writing . device_busy in
* scsi_device_unbusy ( ) and reading sdev - > restarts .
*/
int old = atomic_read ( & sdev - > restarts ) ;
/*
* - > restarts has to be kept as non - zero if new budget
* contention occurs .
*
* No need to run queue when either another re - run
* queue wins in updating - > restarts or a new budget
* contention occurs .
*/
if ( old & & atomic_cmpxchg ( & sdev - > restarts , old , 0 ) = = old )
blk_mq_run_hw_queues ( sdev - > request_queue , true ) ;
}
2020-07-20 05:54:35 +03:00
}
2018-06-23 13:22:14 +03:00
/* Returns false when no more bytes to process, true if there are more */
2017-06-03 10:38:04 +03:00
static bool scsi_end_request ( struct request * req , blk_status_t error ,
2019-01-29 11:33:07 +03:00
unsigned int bytes )
2014-02-16 18:16:13 +04:00
{
2017-08-25 23:46:32 +03:00
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( req ) ;
2014-02-16 18:16:13 +04:00
struct scsi_device * sdev = cmd - > device ;
struct request_queue * q = sdev - > request_queue ;
if ( blk_update_request ( req , error , bytes ) )
return true ;
2021-11-26 15:18:00 +03:00
// XXX:
2014-02-16 18:16:13 +04:00
if ( blk_queue_add_random ( q ) )
2021-11-26 15:18:00 +03:00
add_disk_randomness ( req - > q - > disk ) ;
2014-02-16 18:16:13 +04:00
2021-06-24 15:39:34 +03:00
if ( ! blk_rq_is_passthrough ( req ) ) {
2017-08-31 02:58:39 +03:00
WARN_ON_ONCE ( ! ( cmd - > flags & SCMD_INITIALIZED ) ) ;
cmd - > flags & = ~ SCMD_INITIALIZED ;
}
2019-03-18 19:29:26 +03:00
/*
* Calling rcu_barrier ( ) is not necessary here because the
* SCSI error handler guarantees that the function called by
* call_rcu ( ) has been called before scsi_end_request ( ) is
* called .
*/
destroy_rcu_head ( & cmd - > rcu ) ;
2018-11-02 01:36:27 +03:00
/*
* In the MQ case the command gets freed by __blk_mq_end_request ,
* so we have to do all cleanup that depends on it earlier .
*
* We also can ' t kick the queues from irq context , so we
* will have to defer it to a workqueue .
*/
scsi_mq_uninit_cmd ( cmd ) ;
2014-09-16 18:41:13 +04:00
2018-11-19 01:46:03 +03:00
/*
* queue is still alive , so grab the ref for preventing it
* from being cleaned up during running queue .
*/
percpu_ref_get ( & q - > q_usage_counter ) ;
2014-09-16 18:41:13 +04:00
2018-11-02 01:36:27 +03:00
__blk_mq_end_request ( req , error ) ;
2014-01-17 15:06:53 +04:00
2020-07-20 05:54:35 +03:00
scsi_run_queue_async ( sdev ) ;
2014-02-16 18:16:13 +04:00
2018-11-19 01:46:03 +03:00
percpu_ref_put ( & q - > q_usage_counter ) ;
2014-02-16 18:16:13 +04:00
return false ;
}
2013-07-01 17:16:23 +04:00
/**
2018-04-05 20:33:00 +03:00
* scsi_result_to_blk_status - translate a SCSI result code into blk_status_t
* @ cmd : SCSI command
2013-07-01 17:16:23 +04:00
* @ result : scsi error code
*
2018-04-05 20:33:00 +03:00
* Translate a SCSI result code into a blk_status_t value . May reset the host
* byte of @ cmd - > result .
2013-07-01 17:16:23 +04:00
*/
2018-04-05 20:33:00 +03:00
static blk_status_t scsi_result_to_blk_status ( struct scsi_cmnd * cmd , int result )
2011-01-18 12:13:11 +03:00
{
2017-06-03 10:38:04 +03:00
switch ( host_byte ( result ) ) {
2018-04-05 20:33:01 +03:00
case DID_OK :
2021-04-27 11:30:44 +03:00
if ( scsi_status_is_good ( result ) )
2018-04-05 20:33:01 +03:00
return BLK_STS_OK ;
return BLK_STS_IOERR ;
2011-01-18 12:13:11 +03:00
case DID_TRANSPORT_FAILFAST :
2021-01-07 00:49:04 +03:00
case DID_TRANSPORT_MARGINAL :
2017-06-03 10:38:04 +03:00
return BLK_STS_TRANSPORT ;
2011-01-18 12:13:11 +03:00
case DID_TARGET_FAILURE :
2012-01-25 00:38:46 +04:00
set_host_byte ( cmd , DID_OK ) ;
2017-06-03 10:38:04 +03:00
return BLK_STS_TARGET ;
2011-01-18 12:13:11 +03:00
case DID_NEXUS_FAILURE :
2019-02-15 00:57:41 +03:00
set_host_byte ( cmd , DID_OK ) ;
2017-06-03 10:38:04 +03:00
return BLK_STS_NEXUS ;
2013-07-01 17:16:25 +04:00
case DID_ALLOC_FAILURE :
set_host_byte ( cmd , DID_OK ) ;
2017-06-03 10:38:04 +03:00
return BLK_STS_NOSPC ;
2013-07-01 17:16:26 +04:00
case DID_MEDIUM_ERROR :
set_host_byte ( cmd , DID_OK ) ;
2017-06-03 10:38:04 +03:00
return BLK_STS_MEDIUM ;
2011-01-18 12:13:11 +03:00
default :
2017-06-03 10:38:04 +03:00
return BLK_STS_IOERR ;
2011-01-18 12:13:11 +03:00
}
}
2021-11-17 09:13:54 +03:00
/**
* scsi_rq_err_bytes - determine number of bytes till the next failure boundary
* @ rq : request to examine
*
* Description :
* A request could be merge of IOs which require different failure
* handling . This function determines the number of bytes which
* can be failed from the beginning of the request without
* crossing into area which need to be retried further .
*
* Return :
* The number of bytes to fail .
*/
static unsigned int scsi_rq_err_bytes ( const struct request * rq )
{
unsigned int ff = rq - > cmd_flags & REQ_FAILFAST_MASK ;
unsigned int bytes = 0 ;
struct bio * bio ;
if ( ! ( rq - > rq_flags & RQF_MIXED_MERGE ) )
return blk_rq_bytes ( rq ) ;
/*
* Currently the only ' mixing ' which can happen is between
* different fastfail types . We can safely fail portions
* which have all the failfast bits that the first one has -
* the ones which are at least as eager to fail as the first
* one .
*/
for ( bio = rq - > bio ; bio ; bio = bio - > bi_next ) {
if ( ( bio - > bi_opf & ff ) ! = ff )
break ;
bytes + = bio - > bi_iter . bi_size ;
}
/* this could lead to infinite loop */
BUG_ON ( blk_rq_bytes ( rq ) & & ! bytes ) ;
return bytes ;
}
2018-06-23 13:22:18 +03:00
/* Helper for scsi_io_completion() when "reprep" action required. */
static void scsi_io_completion_reprep ( struct scsi_cmnd * cmd ,
struct request_queue * q )
{
/* A new command will be prepared and issued. */
2018-11-02 01:36:27 +03:00
scsi_mq_requeue_cmd ( cmd ) ;
2018-06-23 13:22:18 +03:00
}
2020-10-01 18:35:53 +03:00
static bool scsi_cmd_runtime_exceeced ( struct scsi_cmnd * cmd )
{
2021-08-10 02:03:05 +03:00
struct request * req = scsi_cmd_to_rq ( cmd ) ;
2020-10-01 18:35:53 +03:00
unsigned long wait_for ;
if ( cmd - > allowed = = SCSI_CMD_RETRIES_NO_LIMIT )
return false ;
wait_for = ( cmd - > allowed + 1 ) * req - > timeout ;
if ( time_before ( cmd - > jiffies_at_alloc + wait_for , jiffies ) ) {
scmd_printk ( KERN_ERR , cmd , " timing out command, waited %lus \n " ,
wait_for / HZ ) ;
return true ;
}
return false ;
}
2018-06-23 13:22:17 +03:00
/* Helper for scsi_io_completion() when special action required. */
static void scsi_io_completion_action ( struct scsi_cmnd * cmd , int result )
2005-04-17 02:20:36 +04:00
{
2007-07-24 11:28:11 +04:00
struct request_queue * q = cmd - > device - > request_queue ;
2021-08-10 02:03:05 +03:00
struct request * req = scsi_cmd_to_rq ( cmd ) ;
2018-06-23 13:22:17 +03:00
int level = 0 ;
2008-11-03 23:56:47 +03:00
enum { ACTION_FAIL , ACTION_REPREP , ACTION_RETRY ,
ACTION_DELAYED_RETRY } action ;
2018-06-23 13:22:17 +03:00
struct scsi_sense_hdr sshdr ;
bool sense_valid ;
bool sense_current = true ; /* false implies "deferred sense" */
blk_status_t blk_stat ;
2005-04-17 02:20:36 +04:00
2018-06-23 13:22:17 +03:00
sense_valid = scsi_command_normalize_sense ( cmd , & sshdr ) ;
if ( sense_valid )
sense_current = ! scsi_sense_is_deferred ( & sshdr ) ;
2006-06-23 20:39:09 +04:00
2018-06-23 13:22:17 +03:00
blk_stat = scsi_result_to_blk_status ( cmd , result ) ;
2009-01-04 11:04:31 +03:00
2008-11-03 23:56:47 +03:00
if ( host_byte ( result ) = = DID_RESET ) {
/* Third party bus reset or reset for error recovery
* reasons . Just retry the command and see what
* happens .
*/
action = ACTION_RETRY ;
2018-06-23 13:22:17 +03:00
} else if ( sense_valid & & sense_current ) {
2005-04-17 02:20:36 +04:00
switch ( sshdr . sense_key ) {
case UNIT_ATTENTION :
if ( cmd - > device - > removable ) {
2006-06-23 20:39:09 +04:00
/* Detected disc change. Set a bit
2005-04-17 02:20:36 +04:00
* and quietly refuse further access .
*/
cmd - > device - > changed = 1 ;
2008-11-03 23:56:47 +03:00
action = ACTION_FAIL ;
2005-04-17 02:20:36 +04:00
} else {
2006-06-23 20:39:09 +04:00
/* Must have been a power glitch, or a
* bus reset . Could not have been a
* media change , so we just retry the
2008-11-03 23:56:47 +03:00
* command and see what happens .
2006-06-23 20:39:09 +04:00
*/
2008-11-03 23:56:47 +03:00
action = ACTION_RETRY ;
2005-04-17 02:20:36 +04:00
}
break ;
case ILLEGAL_REQUEST :
2006-06-23 20:39:09 +04:00
/* If we had an ILLEGAL REQUEST returned, then
* we may have performed an unsupported
* command . The only thing this should be
* would be a ten byte read where only a six
* byte read was supported . Also , on a system
* where READ CAPACITY failed , we may have
* read past the end of the disk .
*/
2005-11-29 23:03:34 +03:00
if ( ( cmd - > device - > use_10_for_rw & &
sshdr . asc = = 0x20 & & sshdr . ascq = = 0x00 ) & &
2005-04-17 02:20:36 +04:00
( cmd - > cmnd [ 0 ] = = READ_10 | |
cmd - > cmnd [ 0 ] = = WRITE_10 ) ) {
2008-11-03 23:56:47 +03:00
/* This will issue a new 6-byte command. */
2005-04-17 02:20:36 +04:00
cmd - > device - > use_10_for_rw = 0 ;
2008-11-03 23:56:47 +03:00
action = ACTION_REPREP ;
2009-01-04 11:04:31 +03:00
} else if ( sshdr . asc = = 0x10 ) /* DIX */ {
action = ACTION_FAIL ;
2018-06-23 13:22:17 +03:00
blk_stat = BLK_STS_PROTECTION ;
2011-03-08 10:07:15 +03:00
/* INVALID COMMAND OPCODE or INVALID FIELD IN CDB */
2012-09-18 20:19:32 +04:00
} else if ( sshdr . asc = = 0x20 | | sshdr . asc = = 0x24 ) {
2011-03-08 10:07:15 +03:00
action = ACTION_FAIL ;
2018-06-23 13:22:17 +03:00
blk_stat = BLK_STS_TARGET ;
2008-11-03 23:56:47 +03:00
} else
action = ACTION_FAIL ;
break ;
2008-07-17 12:28:33 +04:00
case ABORTED_COMMAND :
2009-02-20 00:48:54 +03:00
action = ACTION_FAIL ;
2014-07-10 11:41:53 +04:00
if ( sshdr . asc = = 0x10 ) /* DIF */
2018-06-23 13:22:17 +03:00
blk_stat = BLK_STS_PROTECTION ;
2005-04-17 02:20:36 +04:00
break ;
case NOT_READY :
2006-06-23 20:39:09 +04:00
/* If the device is in the process of becoming
2006-04-26 01:48:30 +04:00
* ready , or has a temporary blockage , retry .
2005-04-17 02:20:36 +04:00
*/
2006-04-26 01:48:30 +04:00
if ( sshdr . asc = = 0x04 ) {
switch ( sshdr . ascq ) {
case 0x01 : /* becoming ready */
case 0x04 : /* format in progress */
case 0x05 : /* rebuild in progress */
case 0x06 : /* recalculation in progress */
case 0x07 : /* operation in progress */
case 0x08 : /* Long write in progress */
case 0x09 : /* self test in progress */
2021-06-29 18:58:26 +03:00
case 0x11 : /* notify (enable spinup) required */
2009-11-26 20:00:41 +03:00
case 0x14 : /* space allocation in progress */
2018-05-19 02:25:47 +03:00
case 0x1a : /* start stop unit in progress */
case 0x1b : /* sanitize in progress */
case 0x1d : /* configuration in progress */
case 0x24 : /* depopulation in progress */
2008-11-03 23:56:47 +03:00
action = ACTION_DELAYED_RETRY ;
2006-04-26 01:48:30 +04:00
break ;
2020-09-30 11:02:56 +03:00
case 0x0a : /* ALUA state transition */
blk_stat = BLK_STS_AGAIN ;
fallthrough ;
2008-12-15 18:31:28 +03:00
default :
action = ACTION_FAIL ;
break ;
2006-04-26 01:48:30 +04:00
}
2014-07-10 11:41:53 +04:00
} else
2008-11-03 23:56:47 +03:00
action = ACTION_FAIL ;
break ;
2005-04-17 02:20:36 +04:00
case VOLUME_OVERFLOW :
2006-06-23 20:39:09 +04:00
/* See SSC3rXX or current. */
2008-11-03 23:56:47 +03:00
action = ACTION_FAIL ;
break ;
2020-09-24 23:53:30 +03:00
case DATA_PROTECT :
action = ACTION_FAIL ;
if ( ( sshdr . asc = = 0x0C & & sshdr . ascq = = 0x12 ) | |
( sshdr . asc = = 0x55 & &
( sshdr . ascq = = 0x0E | | sshdr . ascq = = 0x0F ) ) ) {
/* Insufficient zone resources */
blk_stat = BLK_STS_ZONE_OPEN_RESOURCE ;
}
break ;
2005-04-17 02:20:36 +04:00
default :
2008-11-03 23:56:47 +03:00
action = ACTION_FAIL ;
2005-04-17 02:20:36 +04:00
break ;
}
2014-07-10 11:41:53 +04:00
} else
2008-11-03 23:56:47 +03:00
action = ACTION_FAIL ;
2020-10-01 18:35:53 +03:00
if ( action ! = ACTION_FAIL & & scsi_cmd_runtime_exceeced ( cmd ) )
2014-02-11 09:29:52 +04:00
action = ACTION_FAIL ;
2008-11-03 23:56:47 +03:00
switch ( action ) {
case ACTION_FAIL :
/* Give up and fail the remainder of the request */
2016-10-20 16:12:13 +03:00
if ( ! ( req - > rq_flags & RQF_QUIET ) ) {
2014-10-24 16:27:07 +04:00
static DEFINE_RATELIMIT_STATE ( _rs ,
DEFAULT_RATELIMIT_INTERVAL ,
DEFAULT_RATELIMIT_BURST ) ;
if ( unlikely ( scsi_logging_level ) )
2018-06-23 13:22:17 +03:00
level =
SCSI_LOG_LEVEL ( SCSI_LOG_MLCOMPLETE_SHIFT ,
SCSI_LOG_MLCOMPLETE_BITS ) ;
2014-10-24 16:27:07 +04:00
/*
* if logging is enabled the failure will be printed
* in scsi_log_completion ( ) , so avoid duplicate messages
*/
if ( ! level & & __ratelimit ( & _rs ) ) {
scsi_print_result ( cmd , NULL , FAILED ) ;
2021-04-27 11:30:15 +03:00
if ( sense_valid )
2014-10-24 16:27:07 +04:00
scsi_print_sense ( cmd ) ;
scsi_print_command ( cmd ) ;
}
2005-09-04 20:32:05 +04:00
}
2021-11-17 09:13:54 +03:00
if ( ! scsi_end_request ( req , blk_stat , scsi_rq_err_bytes ( req ) ) )
2014-02-16 18:16:13 +04:00
return ;
2020-08-24 01:36:59 +03:00
fallthrough ;
2008-11-03 23:56:47 +03:00
case ACTION_REPREP :
2018-06-23 13:22:18 +03:00
scsi_io_completion_reprep ( cmd , q ) ;
2008-11-03 23:56:47 +03:00
break ;
case ACTION_RETRY :
/* Retry the same command immediately */
2018-01-11 01:41:45 +03:00
__scsi_queue_insert ( cmd , SCSI_MLQUEUE_EH_RETRY , false ) ;
2008-11-03 23:56:47 +03:00
break ;
case ACTION_DELAYED_RETRY :
/* Retry the same command after a delay */
2018-01-11 01:41:45 +03:00
__scsi_queue_insert ( cmd , SCSI_MLQUEUE_DEVICE_BUSY , false ) ;
2008-11-03 23:56:47 +03:00
break ;
2005-04-17 02:20:36 +04:00
}
}
2018-06-23 13:22:16 +03:00
/*
* Helper for scsi_io_completion ( ) when cmd - > result is non - zero . Returns a
* new result that may suppress further error checking . Also modifies
* * blk_statp in some cases .
*/
static int scsi_io_completion_nz_result ( struct scsi_cmnd * cmd , int result ,
blk_status_t * blk_statp )
{
bool sense_valid ;
bool sense_current = true ; /* false implies "deferred sense" */
2021-08-10 02:03:05 +03:00
struct request * req = scsi_cmd_to_rq ( cmd ) ;
2018-06-23 13:22:16 +03:00
struct scsi_sense_hdr sshdr ;
sense_valid = scsi_command_normalize_sense ( cmd , & sshdr ) ;
if ( sense_valid )
sense_current = ! scsi_sense_is_deferred ( & sshdr ) ;
if ( blk_rq_is_passthrough ( req ) ) {
if ( sense_valid ) {
/*
* SG_IO wants current and deferred errors
*/
scsi_req ( req ) - > sense_len =
min ( 8 + cmd - > sense_buffer [ 7 ] ,
SCSI_SENSE_BUFFERSIZE ) ;
}
if ( sense_current )
* blk_statp = scsi_result_to_blk_status ( cmd , result ) ;
} else if ( blk_rq_bytes ( req ) = = 0 & & sense_current ) {
/*
* Flush commands do not transfers any data , and thus cannot use
* good_bytes ! = blk_rq_bytes ( req ) as the signal for an error .
* This sets * blk_statp explicitly for the problem case .
*/
* blk_statp = scsi_result_to_blk_status ( cmd , result ) ;
}
/*
* Recovered errors need reporting , but they ' re always treated as
* success , so fiddle the result code here . For passthrough requests
* we already took a copy of the original into sreq - > result which
* is what gets returned to the user
*/
if ( sense_valid & & ( sshdr . sense_key = = RECOVERED_ERROR ) ) {
bool do_print = true ;
/*
* if ATA PASS - THROUGH INFORMATION AVAILABLE [ 0x0 , 0x1d ]
* skip print since caller wants ATA registers . Only occurs
* on SCSI ATA PASS_THROUGH commands when CK_COND = 1
*/
if ( ( sshdr . asc = = 0x0 ) & & ( sshdr . ascq = = 0x1d ) )
do_print = false ;
else if ( req - > rq_flags & RQF_QUIET )
do_print = false ;
if ( do_print )
scsi_print_sense ( cmd ) ;
result = 0 ;
/* for passthrough, *blk_statp may be set */
* blk_statp = BLK_STS_OK ;
}
/*
* Another corner case : the SCSI status byte is non - zero but ' good ' .
* Example : PRE - FETCH command returns SAM_STAT_CONDITION_MET when
* it is able to fit nominated LBs in its cache ( and SAM_STAT_GOOD
* if it can ' t fit ) . Treat SAM_STAT_CONDITION_MET and the related
* intermediate statuses ( both obsolete in SAM - 4 ) as good .
*/
2021-04-27 11:30:46 +03:00
if ( ( result & 0xff ) & & scsi_status_is_good ( result ) ) {
2018-06-23 13:22:16 +03:00
result = 0 ;
* blk_statp = BLK_STS_OK ;
}
return result ;
}
2020-04-19 08:01:48 +03:00
/**
* scsi_io_completion - Completion processing for SCSI commands .
* @ cmd : command that is finished .
* @ good_bytes : number of processed bytes .
2005-04-17 02:20:36 +04:00
*
2020-04-19 08:01:48 +03:00
* We will finish off the specified number of sectors . If we are done , the
* command block will be released and the queue function will be goosed . If we
* are not done then we have to figure out what to do next :
2005-04-17 02:20:36 +04:00
*
2020-04-19 08:01:48 +03:00
* a ) We can call scsi_io_completion_reprep ( ) . The request will be
* unprepared and put back on the queue . Then a new command will
* be created for it . This should be used if we made forward
* progress , or if we want to switch from READ ( 10 ) to READ ( 6 ) for
* example .
2005-04-17 02:20:36 +04:00
*
2020-04-19 08:01:48 +03:00
* b ) We can call scsi_io_completion_action ( ) . The request will be
* put back on the queue and retried using the same command as
* before , possibly after a delay .
2008-11-03 23:56:47 +03:00
*
2020-04-19 08:01:48 +03:00
* c ) We can call scsi_end_request ( ) with blk_stat other than
* BLK_STS_OK , to fail the remainder of the request .
2005-04-17 02:20:36 +04:00
*/
2006-06-23 20:39:09 +04:00
void scsi_io_completion ( struct scsi_cmnd * cmd , unsigned int good_bytes )
2005-04-17 02:20:36 +04:00
{
int result = cmd - > result ;
2007-07-24 11:28:11 +04:00
struct request_queue * q = cmd - > device - > request_queue ;
2021-08-10 02:03:05 +03:00
struct request * req = scsi_cmd_to_rq ( cmd ) ;
2018-06-23 13:22:15 +03:00
blk_status_t blk_stat = BLK_STS_OK ;
2005-04-17 02:20:36 +04:00
2018-06-23 13:22:19 +03:00
if ( unlikely ( result ) ) /* a nz result may or may not be an error */
2018-06-23 13:22:16 +03:00
result = scsi_io_completion_nz_result ( cmd , result , & blk_stat ) ;
2006-07-08 22:42:15 +04:00
2018-06-23 13:22:19 +03:00
if ( unlikely ( blk_rq_is_passthrough ( req ) ) ) {
[SCSI] scsi_lib: fix scsi_io_completion's SG_IO error propagation
The following v3.4-rc1 commit unmasked an existing bug in scsi_io_completion's
SG_IO error handling: 47ac56d [SCSI] scsi_error: classify some ILLEGAL_REQUEST
sense as a permanent TARGET_ERROR
Given that certain ILLEGAL_REQUEST are now properly categorized as
TARGET_ERROR the host_byte is being set (before host_byte wasn't ever
set for these ILLEGAL_REQUEST).
In scsi_io_completion, initialize req->errors with cmd->result _after_
the SG_IO block that calls __scsi_error_from_host_byte (which may
modify the host_byte).
Before this fix:
cdb to send: 12 01 01 00 00 00
ioctl(3, SG_IO, {'S', SG_DXFER_NONE, cmd[6]=[12, 01, 01, 00, 00, 00],
mx_sb_len=32, iovec_count=0, dxfer_len=0, timeout=20000, flags=0,
status=02, masked_status=01, sb[19]=[70, 00, 05, 00, 00, 00, 00, 0b,
00, 00, 00, 00, 24, 00, 00, 00, 00, 00, 00], host_status=0x10,
driver_status=0x8, resid=0, duration=0, info=0x1}) = 0
SCSI Status: Check Condition
Sense Information:
sense buffer empty
After:
cdb to send: 12 01 01 00 00 00
ioctl(3, SG_IO, {'S', SG_DXFER_NONE, cmd[6]=[12, 01, 01, 00, 00, 00],
mx_sb_len=32, iovec_count=0, dxfer_len=0, timeout=20000, flags=0,
status=02, masked_status=01, sb[19]=[70, 00, 05, 00, 00, 00, 00, 0b,
00, 00, 00, 00, 24, 00, 00, 00, 00, 00, 00], host_status=0,
driver_status=0x8, resid=0, duration=0, info=0x1}) = 0
SCSI Status: Check Condition
Sense Information:
Fixed format, current; Sense key: Illegal Request
Additional sense: Invalid field in cdb
Raw sense data (in hex):
70 00 05 00 00 00 00 0b 00 00 00 00 24 00 00 00
00 00 00
Reported-by: Paolo Bonzini <pbonzini@redhat.com>
Tested-by: Paolo Bonzini <pbonzini@redhat.com>
Signed-off-by: Mike Snitzer <snitzer@redhat.com>
Reviewed-by: Babu Moger <babu.moger@netapp.com>
Cc: stable@vger.kernel.org # 3.4
Signed-off-by: James Bottomley <JBottomley@Parallels.com>
2012-05-31 23:05:33 +04:00
/*
2018-04-05 20:33:00 +03:00
* scsi_result_to_blk_status may have reset the host_byte
[SCSI] scsi_lib: fix scsi_io_completion's SG_IO error propagation
The following v3.4-rc1 commit unmasked an existing bug in scsi_io_completion's
SG_IO error handling: 47ac56d [SCSI] scsi_error: classify some ILLEGAL_REQUEST
sense as a permanent TARGET_ERROR
Given that certain ILLEGAL_REQUEST are now properly categorized as
TARGET_ERROR the host_byte is being set (before host_byte wasn't ever
set for these ILLEGAL_REQUEST).
In scsi_io_completion, initialize req->errors with cmd->result _after_
the SG_IO block that calls __scsi_error_from_host_byte (which may
modify the host_byte).
Before this fix:
cdb to send: 12 01 01 00 00 00
ioctl(3, SG_IO, {'S', SG_DXFER_NONE, cmd[6]=[12, 01, 01, 00, 00, 00],
mx_sb_len=32, iovec_count=0, dxfer_len=0, timeout=20000, flags=0,
status=02, masked_status=01, sb[19]=[70, 00, 05, 00, 00, 00, 00, 0b,
00, 00, 00, 00, 24, 00, 00, 00, 00, 00, 00], host_status=0x10,
driver_status=0x8, resid=0, duration=0, info=0x1}) = 0
SCSI Status: Check Condition
Sense Information:
sense buffer empty
After:
cdb to send: 12 01 01 00 00 00
ioctl(3, SG_IO, {'S', SG_DXFER_NONE, cmd[6]=[12, 01, 01, 00, 00, 00],
mx_sb_len=32, iovec_count=0, dxfer_len=0, timeout=20000, flags=0,
status=02, masked_status=01, sb[19]=[70, 00, 05, 00, 00, 00, 00, 0b,
00, 00, 00, 00, 24, 00, 00, 00, 00, 00, 00], host_status=0,
driver_status=0x8, resid=0, duration=0, info=0x1}) = 0
SCSI Status: Check Condition
Sense Information:
Fixed format, current; Sense key: Illegal Request
Additional sense: Invalid field in cdb
Raw sense data (in hex):
70 00 05 00 00 00 00 0b 00 00 00 00 24 00 00 00
00 00 00
Reported-by: Paolo Bonzini <pbonzini@redhat.com>
Tested-by: Paolo Bonzini <pbonzini@redhat.com>
Signed-off-by: Mike Snitzer <snitzer@redhat.com>
Reviewed-by: Babu Moger <babu.moger@netapp.com>
Cc: stable@vger.kernel.org # 3.4
Signed-off-by: James Bottomley <JBottomley@Parallels.com>
2012-05-31 23:05:33 +04:00
*/
2017-04-20 17:03:01 +03:00
scsi_req ( req ) - > result = cmd - > result ;
2018-06-23 13:22:20 +03:00
}
2007-12-13 14:47:40 +03:00
2005-04-17 02:20:36 +04:00
/*
* Next deal with any sectors which we were able to correctly
* handle .
*/
2014-06-25 18:39:59 +04:00
SCSI_LOG_HLCOMPLETE ( 1 , scmd_printk ( KERN_INFO , cmd ,
" %u sectors total, %d bytes done. \n " ,
blk_rq_sectors ( req ) , good_bytes ) ) ;
2006-07-02 19:06:28 +04:00
2009-03-30 20:55:51 +04:00
/*
2020-04-19 08:01:48 +03:00
* Failed , zero length commands always need to drop down
2018-06-23 13:22:15 +03:00
* to retry code . Fast path should return in this block .
2006-07-02 19:06:28 +04:00
*/
2018-06-23 13:22:19 +03:00
if ( likely ( blk_rq_bytes ( req ) > 0 | | blk_stat = = BLK_STS_OK ) ) {
2019-01-29 11:33:07 +03:00
if ( likely ( ! scsi_end_request ( req , blk_stat , good_bytes ) ) )
2018-06-23 13:22:15 +03:00
return ; /* no bytes remaining */
}
2014-05-01 18:51:03 +04:00
2018-06-23 13:22:19 +03:00
/* Kill remainder if no retries. */
if ( unlikely ( blk_stat & & scsi_noretry_cmd ( cmd ) ) ) {
2019-01-29 11:33:07 +03:00
if ( scsi_end_request ( req , blk_stat , blk_rq_bytes ( req ) ) )
2018-06-23 13:22:20 +03:00
WARN_ONCE ( true ,
" Bytes remaining after failed, no-retry command " ) ;
2014-02-16 18:16:13 +04:00
return ;
2014-05-01 18:51:03 +04:00
}
/*
* If there had been no error , but we have leftover bytes in the
2021-09-29 21:23:18 +03:00
* request just queue the command up again .
2006-07-02 19:06:28 +04:00
*/
2018-06-23 13:22:19 +03:00
if ( likely ( result = = 0 ) )
2018-06-23 13:22:18 +03:00
scsi_io_completion_reprep ( cmd , q ) ;
else
2018-06-23 13:22:17 +03:00
scsi_io_completion_action ( cmd , result ) ;
2005-04-17 02:20:36 +04:00
}
2020-04-14 10:42:24 +03:00
static inline bool scsi_cmd_needs_dma_drain ( struct scsi_device * sdev ,
struct request * rq )
2005-04-17 02:20:36 +04:00
{
2020-04-14 10:42:24 +03:00
return sdev - > dma_drain_len & & blk_rq_is_passthrough ( rq ) & &
! op_is_write ( req_op ( rq ) ) & &
sdev - > host - > hostt - > dma_need_drain ( rq ) ;
2005-04-17 02:20:36 +04:00
}
2007-12-13 14:50:53 +03:00
2020-04-19 08:01:48 +03:00
/**
2021-04-16 01:08:07 +03:00
* scsi_alloc_sgtables - Allocate and initialize data and integrity scatterlists
* @ cmd : SCSI command data structure to initialize .
*
* Initializes @ cmd - > sdb and also @ cmd - > prot_sdb if data integrity is enabled
* for @ cmd .
2007-12-13 14:50:53 +03:00
*
2020-04-19 08:01:48 +03:00
* Returns :
* * BLK_STS_OK - on success
* * BLK_STS_RESOURCE - if the failure is retryable
* * BLK_STS_IOERR - if the failure is fatal
2007-12-13 14:50:53 +03:00
*/
2020-10-05 11:41:28 +03:00
blk_status_t scsi_alloc_sgtables ( struct scsi_cmnd * cmd )
2007-12-13 14:50:53 +03:00
{
2020-04-14 10:42:24 +03:00
struct scsi_device * sdev = cmd - > device ;
2021-08-10 02:03:05 +03:00
struct request * rq = scsi_cmd_to_rq ( cmd ) ;
2020-04-14 10:42:24 +03:00
unsigned short nr_segs = blk_rq_nr_phys_segments ( rq ) ;
struct scatterlist * last_sg = NULL ;
2018-11-09 16:42:39 +03:00
blk_status_t ret ;
2020-04-14 10:42:24 +03:00
bool need_drain = scsi_cmd_needs_dma_drain ( sdev , rq ) ;
2020-04-14 10:42:23 +03:00
int count ;
2010-09-10 22:50:10 +04:00
2020-04-14 10:42:24 +03:00
if ( WARN_ON_ONCE ( ! nr_segs ) )
2018-11-09 16:42:39 +03:00
return BLK_STS_IOERR ;
2014-06-28 13:51:01 +04:00
2020-04-14 10:42:24 +03:00
/*
* Make sure there is space for the drain . The driver must adjust
* max_hw_segments to be prepared for this .
*/
if ( need_drain )
nr_segs + + ;
2020-04-14 10:42:23 +03:00
/*
* If sg table allocation fails , requeue request later .
*/
2020-04-14 10:42:24 +03:00
if ( unlikely ( sg_alloc_table_chained ( & cmd - > sdb . table , nr_segs ,
cmd - > sdb . table . sgl , SCSI_INLINE_SG_CNT ) ) )
2020-04-14 10:42:23 +03:00
return BLK_STS_RESOURCE ;
/*
* Next , walk the list , and fill in the addresses and sizes of
* each segment .
*/
2020-04-14 10:42:24 +03:00
count = __blk_rq_map_sg ( rq - > q , rq , cmd - > sdb . table . sgl , & last_sg ) ;
2020-04-14 10:42:25 +03:00
if ( blk_rq_bytes ( rq ) & rq - > q - > dma_pad_mask ) {
unsigned int pad_len =
( rq - > q - > dma_pad_mask & ~ blk_rq_bytes ( rq ) ) + 1 ;
last_sg - > length + = pad_len ;
cmd - > extra_len + = pad_len ;
}
2020-04-14 10:42:24 +03:00
if ( need_drain ) {
sg_unmark_end ( last_sg ) ;
last_sg = sg_next ( last_sg ) ;
sg_set_buf ( last_sg , sdev - > dma_drain_buf , sdev - > dma_drain_len ) ;
sg_mark_end ( last_sg ) ;
2020-04-14 10:42:25 +03:00
cmd - > extra_len + = sdev - > dma_drain_len ;
2020-04-14 10:42:24 +03:00
count + + ;
}
2020-04-14 10:42:23 +03:00
BUG_ON ( count > cmd - > sdb . table . nents ) ;
cmd - > sdb . table . nents = count ;
cmd - > sdb . length = blk_rq_payload_bytes ( rq ) ;
2007-12-13 14:50:53 +03:00
2010-09-10 22:50:10 +04:00
if ( blk_integrity_rq ( rq ) ) {
2008-07-18 01:08:48 +04:00
struct scsi_data_buffer * prot_sdb = cmd - > prot_sdb ;
2020-04-14 10:42:23 +03:00
int ivecs ;
2008-07-18 01:08:48 +04:00
2018-11-09 16:42:38 +03:00
if ( WARN_ON_ONCE ( ! prot_sdb ) ) {
2015-01-15 18:02:12 +03:00
/*
* This can happen if someone ( e . g . multipath )
* queues a command to a device on an adapter
* that does not support DIX .
*/
2018-11-09 16:42:39 +03:00
ret = BLK_STS_IOERR ;
2018-11-09 16:42:38 +03:00
goto out_free_sgtables ;
2015-01-15 18:02:12 +03:00
}
2010-09-10 22:50:10 +04:00
ivecs = blk_rq_count_integrity_sg ( rq - > q , rq - > bio ) ;
2008-07-18 01:08:48 +04:00
2016-04-05 00:48:09 +03:00
if ( sg_alloc_table_chained ( & prot_sdb - > table , ivecs ,
2019-04-28 10:39:30 +03:00
prot_sdb - > table . sgl ,
2019-04-28 10:39:31 +03:00
SCSI_INLINE_PROT_SG_CNT ) ) {
2018-11-09 16:42:39 +03:00
ret = BLK_STS_RESOURCE ;
2018-11-09 16:42:38 +03:00
goto out_free_sgtables ;
2008-07-18 01:08:48 +04:00
}
2010-09-10 22:50:10 +04:00
count = blk_rq_map_integrity_sg ( rq - > q , rq - > bio ,
2008-07-18 01:08:48 +04:00
prot_sdb - > table . sgl ) ;
2018-09-05 23:47:20 +03:00
BUG_ON ( count > ivecs ) ;
BUG_ON ( count > queue_max_integrity_segments ( rq - > q ) ) ;
2008-07-18 01:08:48 +04:00
cmd - > prot_sdb = prot_sdb ;
cmd - > prot_sdb - > table . nents = count ;
}
2018-11-09 16:42:39 +03:00
return BLK_STS_OK ;
2018-11-09 16:42:38 +03:00
out_free_sgtables :
2020-04-28 13:45:55 +03:00
scsi_free_sgtables ( cmd ) ;
2018-11-09 16:42:39 +03:00
return ret ;
2007-12-13 14:50:53 +03:00
}
2020-10-05 11:41:28 +03:00
EXPORT_SYMBOL ( scsi_alloc_sgtables ) ;
2005-04-17 02:20:36 +04:00
2017-06-20 21:15:41 +03:00
/**
2017-08-31 02:58:40 +03:00
* scsi_initialize_rq - initialize struct scsi_cmnd partially
2017-08-25 01:11:09 +03:00
* @ rq : Request associated with the SCSI command to be initialized .
2017-06-20 21:15:41 +03:00
*
2017-08-31 02:58:40 +03:00
* This function initializes the members of struct scsi_cmnd that must be
* initialized before request processing starts and that won ' t be
* reinitialized if a SCSI command is requeued .
2017-06-20 21:15:41 +03:00
*/
2017-12-08 02:59:31 +03:00
static void scsi_initialize_rq ( struct request * rq )
2017-06-20 21:15:41 +03:00
{
2017-06-20 21:15:42 +03:00
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( rq ) ;
2021-07-24 10:20:24 +03:00
struct scsi_request * req = & cmd - > req ;
memset ( req - > __cmd , 0 , sizeof ( req - > __cmd ) ) ;
req - > cmd = req - > __cmd ;
req - > cmd_len = BLK_MAX_CDB ;
req - > sense_len = 0 ;
2017-06-20 21:15:42 +03:00
2018-02-22 22:30:20 +03:00
init_rcu_head ( & cmd - > rcu ) ;
2017-08-31 02:58:40 +03:00
cmd - > jiffies_at_alloc = jiffies ;
cmd - > retries = 0 ;
2017-06-20 21:15:41 +03:00
}
2021-10-21 09:06:05 +03:00
struct request * scsi_alloc_request ( struct request_queue * q ,
unsigned int op , blk_mq_req_flags_t flags )
{
struct request * rq ;
2021-10-25 10:05:07 +03:00
rq = blk_mq_alloc_request ( q , op , flags ) ;
2021-10-21 09:06:05 +03:00
if ( ! IS_ERR ( rq ) )
scsi_initialize_rq ( rq ) ;
return rq ;
}
EXPORT_SYMBOL_GPL ( scsi_alloc_request ) ;
2019-07-25 05:05:00 +03:00
/*
* Only called when the request isn ' t completed by SCSI , and not freed by
* SCSI
*/
static void scsi_cleanup_rq ( struct request * rq )
{
if ( rq - > rq_flags & RQF_DONTPREP ) {
scsi_mq_uninit_cmd ( blk_mq_rq_to_pdu ( rq ) ) ;
rq - > rq_flags & = ~ RQF_DONTPREP ;
}
}
2020-01-23 06:56:34 +03:00
/* Called before a request is prepared. See also scsi_mq_prep_fn(). */
2017-01-02 21:55:26 +03:00
void scsi_init_command ( struct scsi_device * dev , struct scsi_cmnd * cmd )
2006-11-04 22:10:55 +03:00
{
2017-01-02 21:55:26 +03:00
void * buf = cmd - > sense_buffer ;
void * prot = cmd - > prot_sdb ;
2021-08-10 02:03:05 +03:00
struct request * rq = scsi_cmd_to_rq ( cmd ) ;
2017-08-31 02:58:39 +03:00
unsigned int flags = cmd - > flags & SCMD_PRESERVED_FLAGS ;
2017-08-31 02:58:40 +03:00
unsigned long jiffies_at_alloc ;
2020-01-23 06:56:34 +03:00
int retries , to_clear ;
2019-10-25 09:58:55 +03:00
bool in_flight ;
2021-01-22 05:33:12 +03:00
int budget_token = cmd - > budget_token ;
2017-08-31 02:58:39 +03:00
2021-06-24 15:39:34 +03:00
if ( ! blk_rq_is_passthrough ( rq ) & & ! ( flags & SCMD_INITIALIZED ) ) {
2017-08-31 02:58:39 +03:00
flags | = SCMD_INITIALIZED ;
scsi_initialize_rq ( rq ) ;
}
2006-11-04 22:10:55 +03:00
2017-08-31 02:58:40 +03:00
jiffies_at_alloc = cmd - > jiffies_at_alloc ;
retries = cmd - > retries ;
2019-10-25 09:58:55 +03:00
in_flight = test_bit ( SCMD_STATE_INFLIGHT , & cmd - > state ) ;
2020-01-23 06:56:34 +03:00
/*
* Zero out the cmd , except for the embedded scsi_request . Only clear
* the driver - private command data if the LLD does not supply a
* function to initialize that data .
*/
to_clear = sizeof ( * cmd ) - sizeof ( cmd - > req ) ;
if ( ! dev - > host - > hostt - > init_cmd_priv )
to_clear + = dev - > host - > hostt - > cmd_size ;
memset ( ( char * ) cmd + sizeof ( cmd - > req ) , 0 , to_clear ) ;
2006-11-04 22:10:55 +03:00
2017-01-02 21:55:26 +03:00
cmd - > device = dev ;
cmd - > sense_buffer = buf ;
cmd - > prot_sdb = prot ;
2017-08-31 02:58:39 +03:00
cmd - > flags = flags ;
2021-10-29 22:43:10 +03:00
INIT_LIST_HEAD ( & cmd - > eh_entry ) ;
2017-01-02 21:55:26 +03:00
INIT_DELAYED_WORK ( & cmd - > abort_work , scmd_eh_abort_handler ) ;
2017-08-31 02:58:40 +03:00
cmd - > jiffies_at_alloc = jiffies_at_alloc ;
cmd - > retries = retries ;
2019-10-25 09:58:55 +03:00
if ( in_flight )
__set_bit ( SCMD_STATE_INFLIGHT , & cmd - > state ) ;
2021-01-22 05:33:12 +03:00
cmd - > budget_token = budget_token ;
2008-04-30 12:19:47 +04:00
2006-11-04 22:10:55 +03:00
}
2018-11-09 16:42:37 +03:00
static blk_status_t scsi_setup_scsi_cmnd ( struct scsi_device * sdev ,
struct request * req )
2005-12-16 05:17:02 +03:00
{
2017-08-25 23:46:32 +03:00
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( req ) ;
2006-11-04 22:10:55 +03:00
/*
2017-01-31 18:57:31 +03:00
* Passthrough requests may transfer data , in which case they must
2006-11-04 22:10:55 +03:00
* a bio attached to them . Or they might contain a SCSI command
* that does not transfer data , in which case they may optionally
* submit a request without an attached bio .
*/
if ( req - > bio ) {
2020-10-05 11:41:28 +03:00
blk_status_t ret = scsi_alloc_sgtables ( cmd ) ;
2018-11-09 16:42:39 +03:00
if ( unlikely ( ret ! = BLK_STS_OK ) )
return ret ;
2006-11-04 22:10:55 +03:00
} else {
2009-05-07 17:24:42 +04:00
BUG_ON ( blk_rq_bytes ( req ) ) ;
2006-11-04 22:10:55 +03:00
2007-12-13 14:47:40 +03:00
memset ( & cmd - > sdb , 0 , sizeof ( cmd - > sdb ) ) ;
2006-11-04 22:10:55 +03:00
}
2005-12-16 05:17:02 +03:00
2017-01-27 11:46:29 +03:00
cmd - > cmd_len = scsi_req ( req ) - > cmd_len ;
cmd - > cmnd = scsi_req ( req ) - > cmd ;
2009-05-07 17:24:42 +04:00
cmd - > transfersize = blk_rq_bytes ( req ) ;
2017-04-05 20:18:12 +03:00
cmd - > allowed = scsi_req ( req ) - > retries ;
2018-11-09 16:42:37 +03:00
return BLK_STS_OK ;
2005-12-16 05:17:02 +03:00
}
2018-11-09 16:42:36 +03:00
static blk_status_t
2020-10-05 11:41:26 +03:00
scsi_device_state_check ( struct scsi_device * sdev , struct request * req )
2006-11-04 22:10:55 +03:00
{
2018-11-09 16:42:36 +03:00
switch ( sdev - > sdev_state ) {
2020-12-09 08:29:49 +03:00
case SDEV_CREATED :
return BLK_STS_OK ;
2018-11-09 16:42:36 +03:00
case SDEV_OFFLINE :
case SDEV_TRANSPORT_OFFLINE :
/*
* If the device is offline we refuse to process any
* commands . The device must be brought online
* before trying any recovery commands .
*/
2020-03-11 17:39:30 +03:00
if ( ! sdev - > offline_already ) {
sdev - > offline_already = true ;
sdev_printk ( KERN_ERR , sdev ,
" rejecting I/O to offline device \n " ) ;
}
2018-11-09 16:42:36 +03:00
return BLK_STS_IOERR ;
case SDEV_DEL :
/*
* If the device is fully deleted , we refuse to
* process any commands as well .
*/
sdev_printk ( KERN_ERR , sdev ,
" rejecting I/O to dead device \n " ) ;
return BLK_STS_IOERR ;
case SDEV_BLOCK :
case SDEV_CREATED_BLOCK :
return BLK_STS_RESOURCE ;
case SDEV_QUIESCE :
/*
2020-12-09 08:29:49 +03:00
* If the device is blocked we only accept power management
* commands .
2018-11-09 16:42:36 +03:00
*/
2020-12-09 08:29:49 +03:00
if ( req & & WARN_ON_ONCE ( ! ( req - > rq_flags & RQF_PM ) ) )
2018-11-09 16:42:36 +03:00
return BLK_STS_RESOURCE ;
return BLK_STS_OK ;
default :
/*
* For any other not fully online state we only allow
2020-12-09 08:29:49 +03:00
* power management commands .
2018-11-09 16:42:36 +03:00
*/
2020-12-09 08:29:49 +03:00
if ( req & & ! ( req - > rq_flags & RQF_PM ) )
2018-11-09 16:42:36 +03:00
return BLK_STS_IOERR ;
return BLK_STS_OK ;
2005-04-17 02:20:36 +04:00
}
2007-08-04 19:06:25 +04:00
}
2005-04-17 02:20:36 +04:00
/*
2021-01-22 05:33:17 +03:00
* scsi_dev_queue_ready : if we can send requests to sdev , assign one token
* and return the token else return - 1.
2005-04-17 02:20:36 +04:00
*/
static inline int scsi_dev_queue_ready ( struct request_queue * q ,
struct scsi_device * sdev )
{
2021-01-22 05:33:17 +03:00
int token ;
2014-04-11 21:07:01 +04:00
2021-01-22 05:33:17 +03:00
token = sbitmap_get ( & sdev - > budget_map ) ;
2014-01-23 15:07:41 +04:00
if ( atomic_read ( & sdev - > device_blocked ) ) {
2021-01-22 05:33:17 +03:00
if ( token < 0 )
goto out ;
if ( scsi_device_busy ( sdev ) > 1 )
2014-04-11 21:07:01 +04:00
goto out_dec ;
2005-04-17 02:20:36 +04:00
/*
* unblock after device_blocked iterates to zero
*/
2018-11-02 01:36:27 +03:00
if ( atomic_dec_return ( & sdev - > device_blocked ) > 0 )
2014-04-11 21:07:01 +04:00
goto out_dec ;
SCSI_LOG_MLQUEUE ( 3 , sdev_printk ( KERN_INFO , sdev ,
" unblocking device at zero depth \n " ) ) ;
2005-04-17 02:20:36 +04:00
}
2014-04-11 21:07:01 +04:00
2021-01-22 05:33:17 +03:00
return token ;
2014-04-11 21:07:01 +04:00
out_dec :
2021-01-22 05:33:17 +03:00
if ( token > = 0 )
sbitmap_put ( & sdev - > budget_map , token ) ;
out :
return - 1 ;
2005-04-17 02:20:36 +04:00
}
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
/*
* scsi_target_queue_ready : checks if there we can send commands to target
* @ sdev : scsi device on starget to check .
*/
static inline int scsi_target_queue_ready ( struct Scsi_Host * shost ,
struct scsi_device * sdev )
{
struct scsi_target * starget = scsi_target ( sdev ) ;
2014-01-22 17:49:41 +04:00
unsigned int busy ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
if ( starget - > single_lun ) {
2014-01-22 17:49:41 +04:00
spin_lock_irq ( shost - > host_lock ) ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
if ( starget - > starget_sdev_user & &
2014-01-22 17:49:41 +04:00
starget - > starget_sdev_user ! = sdev ) {
spin_unlock_irq ( shost - > host_lock ) ;
return 0 ;
}
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
starget - > starget_sdev_user = sdev ;
2014-01-22 17:49:41 +04:00
spin_unlock_irq ( shost - > host_lock ) ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
}
2014-03-26 13:35:00 +04:00
if ( starget - > can_queue < = 0 )
return 1 ;
2014-01-22 17:49:41 +04:00
busy = atomic_inc_return ( & starget - > target_busy ) - 1 ;
2014-01-23 15:07:41 +04:00
if ( atomic_read ( & starget - > target_blocked ) > 0 ) {
2014-01-22 17:49:41 +04:00
if ( busy )
goto starved ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
/*
* unblock after target_blocked iterates to zero
*/
2014-01-23 15:07:41 +04:00
if ( atomic_dec_return ( & starget - > target_blocked ) > 0 )
2014-01-22 17:49:41 +04:00
goto out_dec ;
2014-01-22 17:36:32 +04:00
SCSI_LOG_MLQUEUE ( 3 , starget_printk ( KERN_INFO , starget ,
" unblocking target at zero depth \n " ) ) ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
}
2014-03-26 13:35:00 +04:00
if ( busy > = starget - > can_queue )
2014-01-22 17:49:41 +04:00
goto starved ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
2014-01-22 17:49:41 +04:00
return 1 ;
starved :
spin_lock_irq ( shost - > host_lock ) ;
list_move_tail ( & sdev - > starved_entry , & shost - > starved_list ) ;
2014-01-22 17:36:32 +04:00
spin_unlock_irq ( shost - > host_lock ) ;
2014-01-22 17:49:41 +04:00
out_dec :
2014-03-26 13:35:00 +04:00
if ( starget - > can_queue > 0 )
atomic_dec ( & starget - > target_busy ) ;
2014-01-22 17:49:41 +04:00
return 0 ;
[SCSI] Add helper code so transport classes/driver can control queueing (v3)
SCSI-ml manages the queueing limits for the device and host, but
does not do so at the target level. However something something similar
can come in userful when a driver is transitioning a transport object to
the the blocked state, becuase at that time we do not want to queue
io and we do not want the queuecommand to be called again.
The patch adds code similar to the exisiting SCSI_ML_*BUSY handlers.
You can now return SCSI_MLQUEUE_TARGET_BUSY when we hit
a transport level queueing issue like the hw cannot allocate some
resource at the iscsi session/connection level, or the target has temporarily
closed or shrunk the queueing window, or if we are transitioning
to the blocked state.
bnx2i, when they rework their firmware according to netdev
developers requests, will also need to be able to limit queueing at this
level. bnx2i will hook into libiscsi, but will allocate a scsi host per
netdevice/hba, so unlike pure software iscsi/iser which is allocating
a host per session, it cannot set the scsi_host->can_queue and return
SCSI_MLQUEUE_HOST_BUSY to reflect queueing limits on the transport.
The iscsi class/driver can also set a scsi_target->can_queue value which
reflects the max commands the driver/class can support. For iscsi this
reflects the number of commands we can support for each session due to
session/connection hw limits, driver limits, and to also reflect the
session/targets's queueing window.
Changes:
v1 - initial patch.
v2 - Fix scsi_run_queue handling of multiple blocked targets.
Previously we would break from the main loop if a device was added back on
the starved list. We now run over the list and check if any target is
blocked.
v3 - Rediff for scsi-misc.
Signed-off-by: Mike Christie <michaelc@cs.wisc.edu>
Signed-off-by: James Bottomley <James.Bottomley@HansenPartnership.com>
2008-08-18 00:24:38 +04:00
}
2005-04-17 02:20:36 +04:00
/*
* scsi_host_queue_ready : if we can send requests to shost , return 1 else
* return 0. We must end up running the queue again whenever 0 is
* returned , else IO can hang .
*/
static inline int scsi_host_queue_ready ( struct request_queue * q ,
struct Scsi_Host * shost ,
2019-10-25 09:58:55 +03:00
struct scsi_device * sdev ,
struct scsi_cmnd * cmd )
2005-04-17 02:20:36 +04:00
{
2005-09-19 00:05:20 +04:00
if ( scsi_host_in_recovery ( shost ) )
2014-01-22 18:29:29 +04:00
return 0 ;
2014-01-23 15:07:41 +04:00
if ( atomic_read ( & shost - > host_blocked ) > 0 ) {
2019-10-25 09:58:55 +03:00
if ( scsi_host_busy ( shost ) > 0 )
2014-01-22 18:29:29 +04:00
goto starved ;
2005-04-17 02:20:36 +04:00
/*
* unblock after host_blocked iterates to zero
*/
2014-01-23 15:07:41 +04:00
if ( atomic_dec_return ( & shost - > host_blocked ) > 0 )
2014-01-22 18:29:29 +04:00
goto out_dec ;
2014-01-22 17:36:32 +04:00
SCSI_LOG_MLQUEUE ( 3 ,
shost_printk ( KERN_INFO , shost ,
" unblocking host at zero depth \n " ) ) ;
2005-04-17 02:20:36 +04:00
}
2014-01-22 18:29:29 +04:00
if ( shost - > host_self_blocked )
goto starved ;
2005-04-17 02:20:36 +04:00
/* We're OK to process the command, so we can't be starved */
2014-01-22 18:29:29 +04:00
if ( ! list_empty ( & sdev - > starved_entry ) ) {
spin_lock_irq ( shost - > host_lock ) ;
if ( ! list_empty ( & sdev - > starved_entry ) )
list_del_init ( & sdev - > starved_entry ) ;
spin_unlock_irq ( shost - > host_lock ) ;
}
2005-04-17 02:20:36 +04:00
2019-10-25 09:58:55 +03:00
__set_bit ( SCMD_STATE_INFLIGHT , & cmd - > state ) ;
2014-01-22 18:29:29 +04:00
return 1 ;
starved :
spin_lock_irq ( shost - > host_lock ) ;
if ( list_empty ( & sdev - > starved_entry ) )
list_add_tail ( & sdev - > starved_entry , & shost - > starved_list ) ;
2014-01-22 17:36:32 +04:00
spin_unlock_irq ( shost - > host_lock ) ;
2014-01-22 18:29:29 +04:00
out_dec :
2019-10-25 09:58:55 +03:00
scsi_dec_host_busy ( shost , cmd ) ;
2014-01-22 18:29:29 +04:00
return 0 ;
2005-04-17 02:20:36 +04:00
}
2008-10-04 22:11:35 +04:00
/*
* Busy state exporting function for request stacking drivers .
*
* For efficiency , no lock is taken to check the busy state of
* shost / starget / sdev , since the returned value is not guaranteed and
* may be changed after request stacking drivers call the function ,
* regardless of taking lock or not .
*
2012-06-29 19:33:22 +04:00
* When scsi can ' t dispatch I / Os anymore and needs to kill I / Os scsi
* needs to return ' not busy ' . Otherwise , request stacking drivers
* may hold requests forever .
2008-10-04 22:11:35 +04:00
*/
2018-11-02 01:36:27 +03:00
static bool scsi_mq_lld_busy ( struct request_queue * q )
2008-10-04 22:11:35 +04:00
{
struct scsi_device * sdev = q - > queuedata ;
struct Scsi_Host * shost ;
2012-11-28 16:42:38 +04:00
if ( blk_queue_dying ( q ) )
2018-11-02 01:36:27 +03:00
return false ;
2008-10-04 22:11:35 +04:00
shost = sdev - > host ;
2012-05-22 13:57:17 +04:00
/*
* Ignore host / starget busy state .
* Since block layer does not have a concept of fairness across
* multiple queues , congestion of host / starget needs to be handled
* in SCSI layer .
*/
if ( scsi_host_in_recovery ( shost ) | | scsi_device_is_busy ( sdev ) )
2018-11-02 01:36:27 +03:00
return true ;
2006-04-11 12:27:53 +04:00
2018-11-02 01:36:27 +03:00
return false ;
2005-04-17 02:20:36 +04:00
}
2021-04-16 01:08:09 +03:00
/*
* Block layer request completion callback . May be called from interrupt
* context .
*/
static void scsi_complete ( struct request * rq )
2006-01-09 18:03:03 +03:00
{
2017-08-25 23:46:32 +03:00
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( rq ) ;
2021-04-16 01:08:11 +03:00
enum scsi_disposition disposition ;
2006-01-09 18:03:03 +03:00
INIT_LIST_HEAD ( & cmd - > eh_entry ) ;
2008-09-14 16:55:09 +04:00
atomic_inc ( & cmd - > device - > iodone_cnt ) ;
if ( cmd - > result )
atomic_inc ( & cmd - > device - > ioerr_cnt ) ;
2006-01-09 18:03:03 +03:00
disposition = scsi_decide_disposition ( cmd ) ;
2020-10-01 18:35:53 +03:00
if ( disposition ! = SUCCESS & & scsi_cmd_runtime_exceeced ( cmd ) )
2006-01-09 18:03:03 +03:00
disposition = SUCCESS ;
2014-06-25 18:39:59 +04:00
2006-01-09 18:03:03 +03:00
scsi_log_completion ( cmd , disposition ) ;
switch ( disposition ) {
2020-06-19 18:41:17 +03:00
case SUCCESS :
scsi_finish_command ( cmd ) ;
break ;
case NEEDS_RETRY :
scsi_queue_insert ( cmd , SCSI_MLQUEUE_EH_RETRY ) ;
break ;
case ADD_TO_MLQUEUE :
scsi_queue_insert ( cmd , SCSI_MLQUEUE_DEVICE_BUSY ) ;
break ;
default :
scsi_eh_scmd_add ( cmd ) ;
break ;
2006-01-09 18:03:03 +03:00
}
}
2014-09-06 05:23:07 +04:00
/**
2020-10-23 19:33:14 +03:00
* scsi_dispatch_cmd - Dispatch a command to the low - level driver .
2014-09-06 05:23:07 +04:00
* @ cmd : command block we are dispatching .
*
* Return : nonzero return request was rejected and device ' s queue needs to be
* plugged .
*/
static int scsi_dispatch_cmd ( struct scsi_cmnd * cmd )
{
struct Scsi_Host * host = cmd - > device - > host ;
int rtn = 0 ;
atomic_inc ( & cmd - > device - > iorequest_cnt ) ;
/* check if the device is still usable */
if ( unlikely ( cmd - > device - > sdev_state = = SDEV_DEL ) ) {
/* in SDEV_DEL we error all commands. DID_NO_CONNECT
* returns an immediate error upwards , and signals
* that the device is no longer present */
cmd - > result = DID_NO_CONNECT < < 16 ;
goto done ;
}
/* Check to see if the scsi lld made this device blocked. */
if ( unlikely ( scsi_device_blocked ( cmd - > device ) ) ) {
/*
* in blocked state , the command is just put back on
* the device queue . The suspend state has already
* blocked the queue so future requests should not
* occur until the device transitions out of the
* suspend state .
*/
SCSI_LOG_MLQUEUE ( 3 , scmd_printk ( KERN_INFO , cmd ,
" queuecommand : device blocked \n " ) ) ;
return SCSI_MLQUEUE_DEVICE_BUSY ;
}
/* Store the LUN value in cmnd, if needed. */
if ( cmd - > device - > lun_in_cdb )
cmd - > cmnd [ 1 ] = ( cmd - > cmnd [ 1 ] & 0x1f ) |
( cmd - > device - > lun < < 5 & 0xe0 ) ;
scsi_log_send ( cmd ) ;
/*
* Before we queue this command , check if the command
* length exceeds what the host adapter can handle .
*/
if ( cmd - > cmd_len > cmd - > device - > host - > max_cmd_len ) {
SCSI_LOG_MLQUEUE ( 3 , scmd_printk ( KERN_INFO , cmd ,
" queuecommand : command too long. "
" cdb_size=%d host->max_cmd_len=%d \n " ,
cmd - > cmd_len , cmd - > device - > host - > max_cmd_len ) ) ;
cmd - > result = ( DID_ABORT < < 16 ) ;
goto done ;
}
if ( unlikely ( host - > shost_state = = SHOST_DEL ) ) {
cmd - > result = ( DID_NO_CONNECT < < 16 ) ;
goto done ;
}
trace_scsi_dispatch_cmd_start ( cmd ) ;
rtn = host - > hostt - > queuecommand ( host , cmd ) ;
if ( rtn ) {
trace_scsi_dispatch_cmd_error ( cmd , rtn ) ;
if ( rtn ! = SCSI_MLQUEUE_DEVICE_BUSY & &
rtn ! = SCSI_MLQUEUE_TARGET_BUSY )
rtn = SCSI_MLQUEUE_HOST_BUSY ;
SCSI_LOG_MLQUEUE ( 3 , scmd_printk ( KERN_INFO , cmd ,
" queuecommand : request rejected \n " ) ) ;
}
return rtn ;
done :
2021-10-07 23:46:11 +03:00
scsi_done ( cmd ) ;
2014-09-06 05:23:07 +04:00
return 0 ;
}
2017-06-03 00:21:59 +03:00
/* Size in bytes of the sg-list stored in the scsi-mq command-private data. */
2019-04-28 10:39:32 +03:00
static unsigned int scsi_mq_inline_sgl_size ( struct Scsi_Host * shost )
2017-06-03 00:21:59 +03:00
{
2019-04-28 10:39:32 +03:00
return min_t ( unsigned int , shost - > sg_tablesize , SCSI_INLINE_SG_CNT ) *
2017-06-03 00:21:59 +03:00
sizeof ( struct scatterlist ) ;
}
2020-10-05 11:41:27 +03:00
static blk_status_t scsi_prepare_cmd ( struct request * req )
2014-01-17 15:06:53 +04:00
{
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( req ) ;
struct scsi_device * sdev = req - > q - > queuedata ;
struct Scsi_Host * shost = sdev - > host ;
struct scatterlist * sg ;
2017-06-03 00:22:00 +03:00
scsi_init_command ( sdev , cmd ) ;
2014-01-17 15:06:53 +04:00
cmd - > prot_op = SCSI_PROT_NORMAL ;
2020-10-08 23:06:11 +03:00
if ( blk_rq_bytes ( req ) )
cmd - > sc_data_direction = rq_dma_dir ( req ) ;
else
cmd - > sc_data_direction = DMA_NONE ;
2014-01-17 15:06:53 +04:00
sg = ( void * ) cmd + sizeof ( struct scsi_cmnd ) + shost - > hostt - > cmd_size ;
cmd - > sdb . table . sgl = sg ;
if ( scsi_host_get_prot ( shost ) ) {
memset ( cmd - > prot_sdb , 0 , sizeof ( struct scsi_data_buffer ) ) ;
cmd - > prot_sdb - > table . sgl =
( struct scatterlist * ) ( cmd - > prot_sdb + 1 ) ;
}
2020-10-05 11:41:29 +03:00
/*
* Special handling for passthrough commands , which don ' t go to the ULP
* at all :
*/
2021-06-24 15:39:34 +03:00
if ( blk_rq_is_passthrough ( req ) )
2020-10-05 11:41:29 +03:00
return scsi_setup_scsi_cmnd ( sdev , req ) ;
if ( sdev - > handler & & sdev - > handler - > prep_fn ) {
blk_status_t ret = sdev - > handler - > prep_fn ( sdev , req ) ;
2014-09-22 17:59:31 +04:00
2020-10-05 11:41:29 +03:00
if ( ret ! = BLK_STS_OK )
return ret ;
}
cmd - > cmnd = scsi_req ( req ) - > cmd = scsi_req ( req ) - > __cmd ;
memset ( cmd - > cmnd , 0 , BLK_MAX_CDB ) ;
return scsi_cmd_to_driver ( cmd ) - > init_command ( cmd ) ;
2014-01-17 15:06:53 +04:00
}
2021-10-07 23:27:57 +03:00
void scsi_done ( struct scsi_cmnd * cmd )
2014-01-17 15:06:53 +04:00
{
2021-10-07 23:27:56 +03:00
switch ( cmd - > submitter ) {
case SUBMITTED_BY_BLOCK_LAYER :
break ;
case SUBMITTED_BY_SCSI_ERROR_HANDLER :
return scsi_eh_done ( cmd ) ;
case SUBMITTED_BY_SCSI_RESET_IOCTL :
return ;
}
2021-08-10 02:03:05 +03:00
if ( unlikely ( blk_should_fake_timeout ( scsi_cmd_to_rq ( cmd ) - > q ) ) )
2020-06-11 09:44:47 +03:00
return ;
2018-11-26 19:54:29 +03:00
if ( unlikely ( test_and_set_bit ( SCMD_STATE_COMPLETE , & cmd - > state ) ) )
return ;
2014-01-17 15:06:53 +04:00
trace_scsi_dispatch_cmd_done ( cmd ) ;
2021-08-10 02:03:05 +03:00
blk_mq_complete_request ( scsi_cmd_to_rq ( cmd ) ) ;
2014-01-17 15:06:53 +04:00
}
2021-10-07 23:27:57 +03:00
EXPORT_SYMBOL ( scsi_done ) ;
2014-01-17 15:06:53 +04:00
2021-01-22 05:33:12 +03:00
static void scsi_mq_put_budget ( struct request_queue * q , int budget_token )
2014-01-17 15:06:53 +04:00
{
2017-10-14 12:22:32 +03:00
struct scsi_device * sdev = q - > queuedata ;
2021-01-22 05:33:17 +03:00
sbitmap_put ( & sdev - > budget_map , budget_token ) ;
2017-10-14 12:22:32 +03:00
}
2021-01-22 05:33:12 +03:00
static int scsi_mq_get_budget ( struct request_queue * q )
2017-10-14 12:22:32 +03:00
{
2014-01-17 15:06:53 +04:00
struct scsi_device * sdev = q - > queuedata ;
2021-01-22 05:33:17 +03:00
int token = scsi_dev_queue_ready ( q , sdev ) ;
2014-01-17 15:06:53 +04:00
2021-01-22 05:33:17 +03:00
if ( token > = 0 )
return token ;
2020-09-10 10:50:56 +03:00
atomic_inc ( & sdev - > restarts ) ;
/*
* Orders atomic_inc ( & sdev - > restarts ) and atomic_read ( & sdev - > device_busy ) .
* . restarts must be incremented before . device_busy is read because the
* code in scsi_run_queue_async ( ) depends on the order of these operations .
*/
smp_mb__after_atomic ( ) ;
/*
* If all in - flight requests originated from this LUN are completed
* before reading . device_busy , sdev - > device_busy will be observed as
* zero , then blk_mq_delay_run_hw_queues ( ) will dispatch this request
* soon . Otherwise , completion of one of these requests will observe
* the . restarts flag , and the request queue will be run for handling
* this request , see scsi_end_request ( ) .
*/
2021-01-22 05:33:15 +03:00
if ( unlikely ( scsi_device_busy ( sdev ) = = 0 & &
2020-09-10 10:50:56 +03:00
! scsi_device_blocked ( sdev ) ) )
blk_mq_delay_run_hw_queues ( sdev - > request_queue , SCSI_QUEUE_DELAY ) ;
2021-01-22 05:33:12 +03:00
return - 1 ;
2017-10-14 12:22:32 +03:00
}
2021-01-22 05:33:11 +03:00
static void scsi_mq_set_rq_budget_token ( struct request * req , int token )
{
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( req ) ;
cmd - > budget_token = token ;
}
static int scsi_mq_get_rq_budget_token ( struct request * req )
{
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( req ) ;
return cmd - > budget_token ;
2017-10-14 12:22:32 +03:00
}
2017-06-03 10:38:05 +03:00
static blk_status_t scsi_queue_rq ( struct blk_mq_hw_ctx * hctx ,
2014-10-29 20:14:52 +03:00
const struct blk_mq_queue_data * bd )
2014-01-17 15:06:53 +04:00
{
2014-10-29 20:14:52 +03:00
struct request * req = bd - > rq ;
2014-01-17 15:06:53 +04:00
struct request_queue * q = req - > q ;
struct scsi_device * sdev = q - > queuedata ;
struct Scsi_Host * shost = sdev - > host ;
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( req ) ;
2017-06-03 10:38:05 +03:00
blk_status_t ret ;
2014-01-17 15:06:53 +04:00
int reason ;
2021-01-22 05:33:12 +03:00
WARN_ON_ONCE ( cmd - > budget_token < 0 ) ;
2018-11-09 16:42:36 +03:00
/*
* If the device is not in running state we will reject some or all
* commands .
*/
if ( unlikely ( sdev - > sdev_state ! = SDEV_RUNNING ) ) {
2020-10-05 11:41:26 +03:00
ret = scsi_device_state_check ( sdev , req ) ;
2018-11-09 16:42:36 +03:00
if ( ret ! = BLK_STS_OK )
goto out_put_budget ;
}
2014-01-17 15:06:53 +04:00
2017-06-03 10:38:05 +03:00
ret = BLK_STS_RESOURCE ;
2014-01-17 15:06:53 +04:00
if ( ! scsi_target_queue_ready ( shost , sdev ) )
2017-11-04 04:55:34 +03:00
goto out_put_budget ;
2019-10-25 09:58:55 +03:00
if ( ! scsi_host_queue_ready ( q , shost , sdev , cmd ) )
2014-01-17 15:06:53 +04:00
goto out_dec_target_busy ;
2016-10-20 16:12:13 +03:00
if ( ! ( req - > rq_flags & RQF_DONTPREP ) ) {
2020-10-05 11:41:27 +03:00
ret = scsi_prepare_cmd ( req ) ;
2017-06-03 10:38:05 +03:00
if ( ret ! = BLK_STS_OK )
2014-01-17 15:06:53 +04:00
goto out_dec_host_busy ;
2016-10-20 16:12:13 +03:00
req - > rq_flags | = RQF_DONTPREP ;
2014-09-22 17:59:31 +04:00
} else {
2019-01-16 03:50:03 +03:00
clear_bit ( SCMD_STATE_COMPLETE , & cmd - > state ) ;
2014-01-17 15:06:53 +04:00
}
2019-05-30 14:28:10 +03:00
cmd - > flags & = SCMD_PRESERVED_FLAGS ;
2014-11-03 14:47:47 +03:00
if ( sdev - > simple_tags )
cmd - > flags | = SCMD_TAGGED ;
2019-05-30 14:28:10 +03:00
if ( bd - > last )
cmd - > flags | = SCMD_LAST ;
2014-10-19 19:13:58 +04:00
2020-10-05 11:41:22 +03:00
scsi_set_resid ( cmd , 0 ) ;
memset ( cmd - > sense_buffer , 0 , SCSI_SENSE_BUFFERSIZE ) ;
2021-10-07 23:27:56 +03:00
cmd - > submitter = SUBMITTED_BY_BLOCK_LAYER ;
2014-01-17 15:06:53 +04:00
2020-10-05 11:41:30 +03:00
blk_mq_start_request ( req ) ;
2014-01-17 15:06:53 +04:00
reason = scsi_dispatch_cmd ( cmd ) ;
if ( reason ) {
scsi_set_blocked ( cmd , reason ) ;
2017-06-03 10:38:05 +03:00
ret = BLK_STS_RESOURCE ;
2014-01-17 15:06:53 +04:00
goto out_dec_host_busy ;
}
2017-06-03 10:38:05 +03:00
return BLK_STS_OK ;
2014-01-17 15:06:53 +04:00
out_dec_host_busy :
2019-10-25 09:58:55 +03:00
scsi_dec_host_busy ( shost , cmd ) ;
2014-01-17 15:06:53 +04:00
out_dec_target_busy :
if ( scsi_target ( sdev ) - > can_queue > 0 )
atomic_dec ( & scsi_target ( sdev ) - > target_busy ) ;
2017-10-14 12:22:32 +03:00
out_put_budget :
2021-01-22 05:33:12 +03:00
scsi_mq_put_budget ( q , cmd - > budget_token ) ;
cmd - > budget_token = - 1 ;
2014-01-17 15:06:53 +04:00
switch ( ret ) {
2017-06-03 10:38:05 +03:00
case BLK_STS_OK :
break ;
case BLK_STS_RESOURCE :
2020-05-12 11:55:47 +03:00
case BLK_STS_ZONE_RESOURCE :
2020-12-02 13:04:19 +03:00
if ( scsi_device_blocked ( sdev ) )
2018-01-31 06:04:57 +03:00
ret = BLK_STS_DEV_RESOURCE ;
2014-01-17 15:06:53 +04:00
break ;
2020-09-30 11:02:54 +03:00
case BLK_STS_AGAIN :
scsi_req ( req ) - > result = DID_BUS_BUSY < < 16 ;
if ( req - > rq_flags & RQF_DONTPREP )
scsi_mq_uninit_cmd ( cmd ) ;
break ;
2017-06-03 10:38:05 +03:00
default :
2019-04-10 03:02:22 +03:00
if ( unlikely ( ! scsi_device_online ( sdev ) ) )
scsi_req ( req ) - > result = DID_NO_CONNECT < < 16 ;
else
scsi_req ( req ) - > result = DID_ERROR < < 16 ;
2014-01-17 15:06:53 +04:00
/*
2019-04-10 03:02:22 +03:00
* Make sure to release all allocated resources when
2014-01-17 15:06:53 +04:00
* we hit an error , as we will never see this command
* again .
*/
2016-10-20 16:12:13 +03:00
if ( req - > rq_flags & RQF_DONTPREP )
2014-01-17 15:06:53 +04:00
scsi_mq_uninit_cmd ( cmd ) ;
2020-07-20 05:54:35 +03:00
scsi_run_queue_async ( sdev ) ;
2014-01-17 15:06:53 +04:00
break ;
}
return ret ;
}
2014-09-14 03:40:13 +04:00
static enum blk_eh_timer_return scsi_timeout ( struct request * req ,
bool reserved )
{
if ( reserved )
return BLK_EH_RESET_TIMER ;
return scsi_times_out ( req ) ;
}
2017-08-25 23:46:31 +03:00
static int scsi_mq_init_request ( struct blk_mq_tag_set * set , struct request * rq ,
unsigned int hctx_idx , unsigned int numa_node )
2014-01-17 15:06:53 +04:00
{
2017-05-01 19:19:08 +03:00
struct Scsi_Host * shost = set - > driver_data ;
2014-01-17 15:06:53 +04:00
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( rq ) ;
2017-06-03 00:22:00 +03:00
struct scatterlist * sg ;
2020-01-23 06:56:34 +03:00
int ret = 0 ;
2014-01-17 15:06:53 +04:00
2021-03-31 10:29:58 +03:00
cmd - > sense_buffer =
kmem_cache_alloc_node ( scsi_sense_cache , GFP_KERNEL , numa_node ) ;
2014-01-17 15:06:53 +04:00
if ( ! cmd - > sense_buffer )
return - ENOMEM ;
2017-01-27 11:46:29 +03:00
cmd - > req . sense = cmd - > sense_buffer ;
2017-06-03 00:22:00 +03:00
if ( scsi_host_get_prot ( shost ) ) {
sg = ( void * ) cmd + sizeof ( struct scsi_cmnd ) +
shost - > hostt - > cmd_size ;
2019-04-28 10:39:32 +03:00
cmd - > prot_sdb = ( void * ) sg + scsi_mq_inline_sgl_size ( shost ) ;
2017-06-03 00:22:00 +03:00
}
2020-01-23 06:56:34 +03:00
if ( shost - > hostt - > init_cmd_priv ) {
ret = shost - > hostt - > init_cmd_priv ( shost , cmd ) ;
if ( ret < 0 )
2021-03-31 10:29:58 +03:00
kmem_cache_free ( scsi_sense_cache , cmd - > sense_buffer ) ;
2020-01-23 06:56:34 +03:00
}
return ret ;
2014-01-17 15:06:53 +04:00
}
2017-08-25 23:46:31 +03:00
static void scsi_mq_exit_request ( struct blk_mq_tag_set * set , struct request * rq ,
unsigned int hctx_idx )
2014-01-17 15:06:53 +04:00
{
2020-01-23 06:56:34 +03:00
struct Scsi_Host * shost = set - > driver_data ;
2014-01-17 15:06:53 +04:00
struct scsi_cmnd * cmd = blk_mq_rq_to_pdu ( rq ) ;
2020-01-23 06:56:34 +03:00
if ( shost - > hostt - > exit_cmd_priv )
shost - > hostt - > exit_cmd_priv ( shost , cmd ) ;
2021-03-31 10:29:58 +03:00
kmem_cache_free ( scsi_sense_cache , cmd - > sense_buffer ) ;
2014-01-17 15:06:53 +04:00
}
2021-02-15 10:40:44 +03:00
2021-10-12 18:24:29 +03:00
static int scsi_mq_poll ( struct blk_mq_hw_ctx * hctx , struct io_comp_batch * iob )
2021-02-15 10:40:44 +03:00
{
2021-02-15 10:40:48 +03:00
struct Scsi_Host * shost = hctx - > driver_data ;
2021-02-15 10:40:44 +03:00
if ( shost - > hostt - > mq_poll )
return shost - > hostt - > mq_poll ( shost , hctx - > queue_num ) ;
return 0 ;
}
2021-02-15 10:40:48 +03:00
static int scsi_init_hctx ( struct blk_mq_hw_ctx * hctx , void * data ,
unsigned int hctx_idx )
{
struct Scsi_Host * shost = data ;
hctx - > driver_data = shost ;
return 0 ;
}
2016-11-01 17:12:48 +03:00
static int scsi_map_queues ( struct blk_mq_tag_set * set )
{
struct Scsi_Host * shost = container_of ( set , struct Scsi_Host , tag_set ) ;
if ( shost - > hostt - > map_queues )
return shost - > hostt - > map_queues ( shost ) ;
2019-03-12 04:00:28 +03:00
return blk_mq_map_queues ( & set - > map [ HCTX_TYPE_DEFAULT ] ) ;
2016-11-01 17:12:48 +03:00
}
2017-01-02 21:52:10 +03:00
void __scsi_init_queue ( struct Scsi_Host * shost , struct request_queue * q )
2005-04-17 02:20:36 +04:00
{
2012-04-12 09:50:38 +04:00
struct device * dev = shost - > dma_dev ;
2005-04-17 02:20:36 +04:00
2007-08-07 11:02:51 +04:00
/*
* this limit is imposed by hardware restrictions
*/
2010-02-26 08:20:39 +03:00
blk_queue_max_segments ( q , min_t ( unsigned short , shost - > sg_tablesize ,
2016-04-05 00:48:10 +03:00
SG_MAX_SEGMENTS ) ) ;
2007-08-07 11:02:51 +04:00
2010-09-10 22:50:10 +04:00
if ( scsi_host_prot_dma ( shost ) ) {
shost - > sg_prot_tablesize =
min_not_zero ( shost - > sg_prot_tablesize ,
( unsigned short ) SCSI_MAX_PROT_SG_SEGMENTS ) ;
BUG_ON ( shost - > sg_prot_tablesize < shost - > sg_tablesize ) ;
blk_queue_max_integrity_segments ( q , shost - > sg_prot_tablesize ) ;
}
2019-07-22 12:20:38 +03:00
if ( dev - > dma_mask ) {
shost - > max_sectors = min_t ( unsigned int , shost - > max_sectors ,
dma_max_mapping_size ( dev ) > > SECTOR_SHIFT ) ;
}
2010-02-26 08:20:38 +03:00
blk_queue_max_hw_sectors ( q , shost - > max_sectors ) ;
2005-04-17 02:20:36 +04:00
blk_queue_segment_boundary ( q , shost - > dma_boundary ) ;
2008-02-05 09:28:17 +03:00
dma_set_seg_boundary ( dev , shost - > dma_boundary ) ;
2005-04-17 02:20:36 +04:00
2019-01-16 19:12:15 +03:00
blk_queue_max_segment_size ( q , shost - > max_segment_size ) ;
2019-06-17 15:19:53 +03:00
blk_queue_virt_boundary ( q , shost - > virt_boundary_mask ) ;
dma_set_max_seg_size ( dev , queue_max_segment_size ( q ) ) ;
2008-01-01 19:00:10 +03:00
/*
2017-11-21 16:23:38 +03:00
* Set a reasonable default alignment : The larger of 32 - byte ( dword ) ,
* which is a common minimum for HBAs , and the minimum DMA alignment ,
* which is set by the platform .
*
* Devices that require a bigger alignment can increase it later .
2008-01-01 19:00:10 +03:00
*/
2017-11-21 16:23:38 +03:00
blk_queue_dma_alignment ( q , max ( 4 , dma_get_cache_alignment ( ) ) - 1 ) ;
2014-01-17 15:06:53 +04:00
}
2017-01-02 21:52:10 +03:00
EXPORT_SYMBOL_GPL ( __scsi_init_queue ) ;
2008-01-01 19:00:10 +03:00
2019-05-30 14:28:10 +03:00
static const struct blk_mq_ops scsi_mq_ops_no_commit = {
. get_budget = scsi_mq_get_budget ,
. put_budget = scsi_mq_put_budget ,
. queue_rq = scsi_queue_rq ,
2021-04-16 01:08:09 +03:00
. complete = scsi_complete ,
2019-05-30 14:28:10 +03:00
. timeout = scsi_timeout ,
# ifdef CONFIG_BLK_DEBUG_FS
. show_rq = scsi_show_rq ,
# endif
. init_request = scsi_mq_init_request ,
. exit_request = scsi_mq_exit_request ,
2019-08-07 17:49:47 +03:00
. cleanup_rq = scsi_cleanup_rq ,
2019-05-30 14:28:10 +03:00
. busy = scsi_mq_lld_busy ,
. map_queues = scsi_map_queues ,
2021-02-15 10:40:48 +03:00
. init_hctx = scsi_init_hctx ,
2021-02-15 10:40:44 +03:00
. poll = scsi_mq_poll ,
2021-01-22 05:33:11 +03:00
. set_rq_budget_token = scsi_mq_set_rq_budget_token ,
. get_rq_budget_token = scsi_mq_get_rq_budget_token ,
2019-05-30 14:28:10 +03:00
} ;
static void scsi_commit_rqs ( struct blk_mq_hw_ctx * hctx )
{
2021-02-15 10:40:48 +03:00
struct Scsi_Host * shost = hctx - > driver_data ;
2019-05-30 14:28:10 +03:00
shost - > hostt - > commit_rqs ( shost , hctx - > queue_num ) ;
}
2017-03-30 23:39:16 +03:00
static const struct blk_mq_ops scsi_mq_ops = {
2017-10-14 12:22:32 +03:00
. get_budget = scsi_mq_get_budget ,
. put_budget = scsi_mq_put_budget ,
2014-01-17 15:06:53 +04:00
. queue_rq = scsi_queue_rq ,
2019-05-30 14:28:10 +03:00
. commit_rqs = scsi_commit_rqs ,
2021-04-16 01:08:09 +03:00
. complete = scsi_complete ,
2014-09-14 03:40:13 +04:00
. timeout = scsi_timeout ,
2017-04-26 23:47:57 +03:00
# ifdef CONFIG_BLK_DEBUG_FS
. show_rq = scsi_show_rq ,
# endif
2017-08-25 23:46:31 +03:00
. init_request = scsi_mq_init_request ,
. exit_request = scsi_mq_exit_request ,
2019-07-25 05:05:00 +03:00
. cleanup_rq = scsi_cleanup_rq ,
2018-10-29 19:17:28 +03:00
. busy = scsi_mq_lld_busy ,
2016-11-01 17:12:48 +03:00
. map_queues = scsi_map_queues ,
2021-02-15 10:40:48 +03:00
. init_hctx = scsi_init_hctx ,
2021-02-15 10:40:44 +03:00
. poll = scsi_mq_poll ,
2021-01-22 05:33:11 +03:00
. set_rq_budget_token = scsi_mq_set_rq_budget_token ,
. get_rq_budget_token = scsi_mq_get_rq_budget_token ,
2014-01-17 15:06:53 +04:00
} ;
int scsi_mq_setup_tags ( struct Scsi_Host * shost )
{
2017-06-03 00:21:59 +03:00
unsigned int cmd_size , sgl_size ;
2020-05-18 10:47:32 +03:00
struct blk_mq_tag_set * tag_set = & shost - > tag_set ;
2014-01-17 15:06:53 +04:00
2019-11-05 05:49:10 +03:00
sgl_size = max_t ( unsigned int , sizeof ( struct scatterlist ) ,
scsi_mq_inline_sgl_size ( shost ) ) ;
2014-01-17 15:06:53 +04:00
cmd_size = sizeof ( struct scsi_cmnd ) + shost - > hostt - > cmd_size + sgl_size ;
if ( scsi_host_get_prot ( shost ) )
2019-04-28 10:39:31 +03:00
cmd_size + = sizeof ( struct scsi_data_buffer ) +
sizeof ( struct scatterlist ) * SCSI_INLINE_PROT_SG_CNT ;
2014-01-17 15:06:53 +04:00
2020-05-18 10:47:32 +03:00
memset ( tag_set , 0 , sizeof ( * tag_set ) ) ;
2019-05-30 14:28:10 +03:00
if ( shost - > hostt - > commit_rqs )
2020-05-18 10:47:32 +03:00
tag_set - > ops = & scsi_mq_ops ;
2019-05-30 14:28:10 +03:00
else
2020-05-18 10:47:32 +03:00
tag_set - > ops = & scsi_mq_ops_no_commit ;
tag_set - > nr_hw_queues = shost - > nr_hw_queues ? : 1 ;
2021-02-15 10:40:44 +03:00
tag_set - > nr_maps = shost - > nr_maps ? : 1 ;
2020-05-18 10:47:32 +03:00
tag_set - > queue_depth = shost - > can_queue ;
tag_set - > cmd_size = cmd_size ;
tag_set - > numa_node = NUMA_NO_NODE ;
tag_set - > flags = BLK_MQ_F_SHOULD_MERGE ;
tag_set - > flags | =
2015-01-24 00:18:00 +03:00
BLK_ALLOC_POLICY_TO_MQ_FLAG ( shost - > hostt - > tag_alloc_policy ) ;
2020-05-18 10:47:32 +03:00
tag_set - > driver_data = shost ;
2020-08-19 18:20:30 +03:00
if ( shost - > host_tagset )
tag_set - > flags | = BLK_MQ_F_TAG_HCTX_SHARED ;
2014-01-17 15:06:53 +04:00
2020-05-18 10:47:32 +03:00
return blk_mq_alloc_tag_set ( tag_set ) ;
2014-01-17 15:06:53 +04:00
}
void scsi_mq_destroy_tags ( struct Scsi_Host * shost )
{
blk_mq_free_tag_set ( & shost - > tag_set ) ;
}
2017-02-17 11:02:45 +03:00
/**
* scsi_device_from_queue - return sdev associated with a request_queue
* @ q : The request queue to return the sdev from
*
* Return the sdev associated with a request queue or NULL if the
* request_queue does not reference a SCSI device .
*/
struct scsi_device * scsi_device_from_queue ( struct request_queue * q )
{
struct scsi_device * sdev = NULL ;
2019-08-07 17:49:48 +03:00
if ( q - > mq_ops = = & scsi_mq_ops_no_commit | |
q - > mq_ops = = & scsi_mq_ops )
2017-02-17 11:02:45 +03:00
sdev = q - > queuedata ;
if ( ! sdev | | ! get_device ( & sdev - > sdev_gendev ) )
sdev = NULL ;
return sdev ;
}
2021-10-21 09:06:07 +03:00
/*
* pktcdvd should have been integrated into the SCSI layers , but for historical
* reasons like the old IDE driver it isn ' t . This export allows it to safely
* probe if a given device is a SCSI one and only attach to that .
*/
# ifdef CONFIG_CDROM_PKTCDVD_MODULE
EXPORT_SYMBOL_GPL ( scsi_device_from_queue ) ;
# endif
2017-02-17 11:02:45 +03:00
2020-04-19 08:01:48 +03:00
/**
* scsi_block_requests - Utility function used by low - level drivers to prevent
* further commands from being queued to the device .
* @ shost : host in question
2005-04-17 02:20:36 +04:00
*
2020-04-19 08:01:48 +03:00
* There is no timer nor any other means by which the requests get unblocked
* other than the low - level driver calling scsi_unblock_requests ( ) .
2005-04-17 02:20:36 +04:00
*/
void scsi_block_requests ( struct Scsi_Host * shost )
{
shost - > host_self_blocked = 1 ;
}
EXPORT_SYMBOL ( scsi_block_requests ) ;
2020-04-19 08:01:48 +03:00
/**
* scsi_unblock_requests - Utility function used by low - level drivers to allow
* further commands to be queued to the device .
* @ shost : host in question
2005-04-17 02:20:36 +04:00
*
2020-04-19 08:01:48 +03:00
* There is no timer nor any other means by which the requests get unblocked
* other than the low - level driver calling scsi_unblock_requests ( ) . This is done
* as an API function so that changes to the internals of the scsi mid - layer
* won ' t require wholesale changes to drivers that use this feature .
2005-04-17 02:20:36 +04:00
*/
void scsi_unblock_requests ( struct Scsi_Host * shost )
{
shost - > host_self_blocked = 0 ;
scsi_run_host_queues ( shost ) ;
}
EXPORT_SYMBOL ( scsi_unblock_requests ) ;
void scsi_exit_queue ( void )
{
2017-01-03 08:28:41 +03:00
kmem_cache_destroy ( scsi_sense_cache ) ;
2005-04-17 02:20:36 +04:00
}
2006-03-18 23:10:35 +03:00
/**
* scsi_mode_select - issue a mode select
* @ sdev : SCSI device to be queried
* @ pf : Page format bit ( 1 = = standard , 0 = = vendor specific )
* @ sp : Save page bit ( 0 = = don ' t save , 1 = = save )
* @ buffer : request buffer ( may not be smaller than eight bytes )
* @ len : length of request buffer .
* @ timeout : command timeout
* @ retries : number of retries before failing
* @ data : returns a structure abstracting the mode header data
2007-11-03 21:30:39 +03:00
* @ sshdr : place to put sense data ( or NULL if no sense to be collected ) .
2006-03-18 23:10:35 +03:00
* must be SCSI_SENSE_BUFFERSIZE big .
*
* Returns zero if successful ; negative error number or scsi
* status on error
*
*/
2021-09-29 12:17:44 +03:00
int scsi_mode_select ( struct scsi_device * sdev , int pf , int sp ,
unsigned char * buffer , int len , int timeout , int retries ,
struct scsi_mode_data * data , struct scsi_sense_hdr * sshdr )
2006-03-18 23:10:35 +03:00
{
unsigned char cmd [ 10 ] ;
unsigned char * real_buffer ;
int ret ;
memset ( cmd , 0 , sizeof ( cmd ) ) ;
cmd [ 1 ] = ( pf ? 0x10 : 0 ) | ( sp ? 0x01 : 0 ) ;
2021-08-20 10:02:54 +03:00
/*
* Use MODE SELECT ( 10 ) if the device asked for it or if the mode page
* and the mode select header cannot fit within the maximumm 255 bytes
* of the MODE SELECT ( 6 ) command .
*/
if ( sdev - > use_10_for_ms | |
len + 4 > 255 | |
data - > block_descriptor_length > 255 ) {
if ( len > 65535 - 8 )
2006-03-18 23:10:35 +03:00
return - EINVAL ;
real_buffer = kmalloc ( 8 + len , GFP_KERNEL ) ;
if ( ! real_buffer )
return - ENOMEM ;
memcpy ( real_buffer + 8 , buffer , len ) ;
len + = 8 ;
real_buffer [ 0 ] = 0 ;
real_buffer [ 1 ] = 0 ;
real_buffer [ 2 ] = data - > medium_type ;
real_buffer [ 3 ] = data - > device_specific ;
real_buffer [ 4 ] = data - > longlba ? 0x01 : 0 ;
real_buffer [ 5 ] = 0 ;
2021-08-20 10:02:54 +03:00
put_unaligned_be16 ( data - > block_descriptor_length ,
& real_buffer [ 6 ] ) ;
2006-03-18 23:10:35 +03:00
cmd [ 0 ] = MODE_SELECT_10 ;
2021-08-20 10:02:54 +03:00
put_unaligned_be16 ( len , & cmd [ 7 ] ) ;
2006-03-18 23:10:35 +03:00
} else {
2021-08-20 10:02:54 +03:00
if ( data - > longlba )
2006-03-18 23:10:35 +03:00
return - EINVAL ;
real_buffer = kmalloc ( 4 + len , GFP_KERNEL ) ;
if ( ! real_buffer )
return - ENOMEM ;
memcpy ( real_buffer + 4 , buffer , len ) ;
len + = 4 ;
real_buffer [ 0 ] = 0 ;
real_buffer [ 1 ] = data - > medium_type ;
real_buffer [ 2 ] = data - > device_specific ;
real_buffer [ 3 ] = data - > block_descriptor_length ;
cmd [ 0 ] = MODE_SELECT ;
cmd [ 4 ] = len ;
}
ret = scsi_execute_req ( sdev , cmd , DMA_TO_DEVICE , real_buffer , len ,
2008-12-04 08:24:39 +03:00
sshdr , timeout , retries , NULL ) ;
2006-03-18 23:10:35 +03:00
kfree ( real_buffer ) ;
return ret ;
}
EXPORT_SYMBOL_GPL ( scsi_mode_select ) ;
2005-04-17 02:20:36 +04:00
/**
2007-11-03 21:30:39 +03:00
* scsi_mode_sense - issue a mode sense , falling back from 10 to six bytes if necessary .
2005-08-28 20:27:01 +04:00
* @ sdev : SCSI device to be queried
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
* @ dbd : set to prevent mode sense from returning block descriptors
2005-04-17 02:20:36 +04:00
* @ modepage : mode page being requested
* @ buffer : request buffer ( may not be smaller than eight bytes )
* @ len : length of request buffer .
* @ timeout : command timeout
* @ retries : number of retries before failing
* @ data : returns a structure abstracting the mode header data
2007-11-03 21:30:39 +03:00
* @ sshdr : place to put sense data ( or NULL if no sense to be collected ) .
2005-08-28 20:27:01 +04:00
* must be SCSI_SENSE_BUFFERSIZE big .
2005-04-17 02:20:36 +04:00
*
2021-04-27 11:30:09 +03:00
* Returns zero if successful , or a negative error number on failure
2007-11-03 21:30:39 +03:00
*/
2005-04-17 02:20:36 +04:00
int
2005-08-28 20:27:01 +04:00
scsi_mode_sense ( struct scsi_device * sdev , int dbd , int modepage ,
2005-04-17 02:20:36 +04:00
unsigned char * buffer , int len , int timeout , int retries ,
2006-03-18 23:10:35 +03:00
struct scsi_mode_data * data , struct scsi_sense_hdr * sshdr )
{
2005-04-17 02:20:36 +04:00
unsigned char cmd [ 12 ] ;
int use_10_for_ms ;
int header_length ;
2015-06-12 17:12:48 +03:00
int result , retry_count = retries ;
2005-08-28 20:33:52 +04:00
struct scsi_sense_hdr my_sshdr ;
2005-04-17 02:20:36 +04:00
memset ( data , 0 , sizeof ( * data ) ) ;
memset ( & cmd [ 0 ] , 0 , 12 ) ;
2019-12-05 05:14:25 +03:00
dbd = sdev - > set_dbd_for_ms ? 8 : dbd ;
2005-04-17 02:20:36 +04:00
cmd [ 1 ] = dbd & 0x18 ; /* allows DBD and LLBA bits */
cmd [ 2 ] = modepage ;
2005-08-28 20:33:52 +04:00
/* caller might not be interested in sense, but we need it */
if ( ! sshdr )
sshdr = & my_sshdr ;
2005-04-17 02:20:36 +04:00
retry :
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
use_10_for_ms = sdev - > use_10_for_ms | | len > 255 ;
2005-04-17 02:20:36 +04:00
if ( use_10_for_ms ) {
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
if ( len < 8 | | len > 65535 )
return - EINVAL ;
2005-04-17 02:20:36 +04:00
cmd [ 0 ] = MODE_SENSE_10 ;
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
put_unaligned_be16 ( len , & cmd [ 7 ] ) ;
2005-04-17 02:20:36 +04:00
header_length = 8 ;
} else {
if ( len < 4 )
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
return - EINVAL ;
2005-04-17 02:20:36 +04:00
cmd [ 0 ] = MODE_SENSE ;
cmd [ 4 ] = len ;
header_length = 4 ;
}
memset ( buffer , 0 , len ) ;
2005-08-28 20:27:01 +04:00
result = scsi_execute_req ( sdev , cmd , DMA_FROM_DEVICE , buffer , len ,
2008-12-04 08:24:39 +03:00
sshdr , timeout , retries , NULL ) ;
2021-04-27 11:30:09 +03:00
if ( result < 0 )
return result ;
2005-04-17 02:20:36 +04:00
/* This code looks awful: what it's doing is making sure an
* ILLEGAL REQUEST sense return identifies the actual command
* byte as the problem . MODE_SENSE commands can return
* ILLEGAL REQUEST if the code page isn ' t supported */
2021-04-27 11:30:10 +03:00
if ( ! scsi_status_is_good ( result ) ) {
2021-04-27 11:30:15 +03:00
if ( scsi_sense_valid ( sshdr ) ) {
2005-08-28 20:33:52 +04:00
if ( ( sshdr - > sense_key = = ILLEGAL_REQUEST ) & &
( sshdr - > asc = = 0x20 ) & & ( sshdr - > ascq = = 0 ) ) {
2020-06-19 18:41:17 +03:00
/*
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
* Invalid command operation code : retry using
* MODE SENSE ( 6 ) if this was a MODE SENSE ( 10 )
* request , except if the request mode page is
* too large for MODE SENSE single byte
* allocation length field .
2005-04-17 02:20:36 +04:00
*/
2021-04-27 11:30:10 +03:00
if ( use_10_for_ms ) {
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
if ( len > 255 )
return - EIO ;
2021-04-27 11:30:10 +03:00
sdev - > use_10_for_ms = 0 ;
goto retry ;
}
}
2021-04-27 11:30:14 +03:00
if ( scsi_status_is_check_condition ( result ) & &
2021-04-27 11:30:10 +03:00
sshdr - > sense_key = = UNIT_ATTENTION & &
retry_count ) {
retry_count - - ;
2005-04-17 02:20:36 +04:00
goto retry ;
}
}
2021-04-27 11:30:10 +03:00
return - EIO ;
2005-04-17 02:20:36 +04:00
}
2021-04-27 11:30:10 +03:00
if ( unlikely ( buffer [ 0 ] = = 0x86 & & buffer [ 1 ] = = 0x0b & &
( modepage = = 6 | | modepage = = 8 ) ) ) {
/* Initio breakage? */
header_length = 0 ;
data - > length = 13 ;
data - > medium_type = 0 ;
data - > device_specific = 0 ;
data - > longlba = 0 ;
data - > block_descriptor_length = 0 ;
} else if ( use_10_for_ms ) {
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
data - > length = get_unaligned_be16 ( & buffer [ 0 ] ) + 2 ;
2021-04-27 11:30:10 +03:00
data - > medium_type = buffer [ 2 ] ;
data - > device_specific = buffer [ 3 ] ;
data - > longlba = buffer [ 4 ] & 0x01 ;
scsi: core: Fix scsi_mode_sense() buffer length handling
Several problems exist with scsi_mode_sense() buffer length handling:
1) The allocation length field of the MODE SENSE(10) command is 16-bits,
occupying bytes 7 and 8 of the CDB. With this command, access to mode
pages larger than 255 bytes is thus possible. However, the CDB
allocation length field is set by assigning len to byte 8 only, thus
truncating buffer length larger than 255.
2) If scsi_mode_sense() is called with len smaller than 8 with
sdev->use_10_for_ms set, or smaller than 4 otherwise, the buffer length
is increased to 8 and 4 respectively, and the buffer is zero filled
with these increased values, thus corrupting the memory following the
buffer.
Fix these 2 problems by using put_unaligned_be16() to set the allocation
length field of MODE SENSE(10) CDB and by returning an error when len is
too small.
Furthermore, if len is larger than 255B, always try MODE SENSE(10) first,
even if the device driver did not set sdev->use_10_for_ms. In case of
invalid opcode error for MODE SENSE(10), access to mode pages larger than
255 bytes are not retried using MODE SENSE(6). To avoid buffer length
overflows for the MODE_SENSE(10) case, check that len is smaller than 65535
bytes.
While at it, also fix the folowing:
* Use get_unaligned_be16() to retrieve the mode data length and block
descriptor length fields of the mode sense reply header instead of using
an open coded calculation.
* Fix the kdoc dbd argument explanation: the DBD bit stands for Disable
Block Descriptor, which is the opposite of what the dbd argument
description was.
Link: https://lore.kernel.org/r/20210820070255.682775-2-damien.lemoal@wdc.com
Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2021-08-20 10:02:53 +03:00
data - > block_descriptor_length = get_unaligned_be16 ( & buffer [ 6 ] ) ;
2021-04-27 11:30:10 +03:00
} else {
data - > length = buffer [ 0 ] + 1 ;
data - > medium_type = buffer [ 1 ] ;
data - > device_specific = buffer [ 2 ] ;
data - > block_descriptor_length = buffer [ 3 ] ;
2005-04-17 02:20:36 +04:00
}
2021-04-27 11:30:10 +03:00
data - > header_length = header_length ;
return 0 ;
2005-04-17 02:20:36 +04:00
}
EXPORT_SYMBOL ( scsi_mode_sense ) ;
2007-12-02 20:10:40 +03:00
/**
* scsi_test_unit_ready - test if unit is ready
* @ sdev : scsi device to change the state of .
* @ timeout : command timeout
* @ retries : number of retries before failing
2017-02-14 22:15:57 +03:00
* @ sshdr : outpout pointer for decoded sense information .
2007-12-02 20:10:40 +03:00
*
* Returns zero if unsuccessful or an error if TUR failed . For
2010-12-08 22:57:40 +03:00
* removable media , UNIT_ATTENTION sets - > changed flag .
2007-12-02 20:10:40 +03:00
* */
2005-04-17 02:20:36 +04:00
int
2007-12-02 20:10:40 +03:00
scsi_test_unit_ready ( struct scsi_device * sdev , int timeout , int retries ,
2017-02-14 22:15:57 +03:00
struct scsi_sense_hdr * sshdr )
2005-04-17 02:20:36 +04:00
{
char cmd [ ] = {
TEST_UNIT_READY , 0 , 0 , 0 , 0 , 0 ,
} ;
int result ;
2007-12-02 20:10:40 +03:00
/* try to eat the UNIT_ATTENTION if there are enough retries */
do {
result = scsi_execute_req ( sdev , cmd , DMA_NONE , NULL , 0 , sshdr ,
2018-02-12 21:57:52 +03:00
timeout , 1 , NULL ) ;
2008-08-20 02:58:13 +04:00
if ( sdev - > removable & & scsi_sense_valid ( sshdr ) & &
sshdr - > sense_key = = UNIT_ATTENTION )
sdev - > changed = 1 ;
} while ( scsi_sense_valid ( sshdr ) & &
sshdr - > sense_key = = UNIT_ATTENTION & & - - retries ) ;
2007-12-02 20:10:40 +03:00
2005-04-17 02:20:36 +04:00
return result ;
}
EXPORT_SYMBOL ( scsi_test_unit_ready ) ;
/**
2007-11-03 21:30:39 +03:00
* scsi_device_set_state - Take the given device through the device state model .
2005-04-17 02:20:36 +04:00
* @ sdev : scsi device to change the state of .
* @ state : state to change to .
*
2017-08-25 14:56:56 +03:00
* Returns zero if successful or an error if the requested
2005-04-17 02:20:36 +04:00
* transition is illegal .
2007-11-03 21:30:39 +03:00
*/
2005-04-17 02:20:36 +04:00
int
scsi_device_set_state ( struct scsi_device * sdev , enum scsi_device_state state )
{
enum scsi_device_state oldstate = sdev - > sdev_state ;
if ( state = = oldstate )
return 0 ;
switch ( state ) {
case SDEV_CREATED :
2008-08-23 01:53:31 +04:00
switch ( oldstate ) {
case SDEV_CREATED_BLOCK :
break ;
default :
goto illegal ;
}
break ;
2020-06-19 18:41:17 +03:00
2005-04-17 02:20:36 +04:00
case SDEV_RUNNING :
switch ( oldstate ) {
case SDEV_CREATED :
case SDEV_OFFLINE :
2012-05-18 08:56:56 +04:00
case SDEV_TRANSPORT_OFFLINE :
2005-04-17 02:20:36 +04:00
case SDEV_QUIESCE :
case SDEV_BLOCK :
break ;
default :
goto illegal ;
}
break ;
case SDEV_QUIESCE :
switch ( oldstate ) {
case SDEV_RUNNING :
case SDEV_OFFLINE :
2012-05-18 08:56:56 +04:00
case SDEV_TRANSPORT_OFFLINE :
2005-04-17 02:20:36 +04:00
break ;
default :
goto illegal ;
}
break ;
case SDEV_OFFLINE :
2012-05-18 08:56:56 +04:00
case SDEV_TRANSPORT_OFFLINE :
2005-04-17 02:20:36 +04:00
switch ( oldstate ) {
case SDEV_CREATED :
case SDEV_RUNNING :
case SDEV_QUIESCE :
case SDEV_BLOCK :
break ;
default :
goto illegal ;
}
break ;
case SDEV_BLOCK :
switch ( oldstate ) {
case SDEV_RUNNING :
2008-08-23 01:53:31 +04:00
case SDEV_CREATED_BLOCK :
scsi: core: Allow the state change from SDEV_QUIESCE to SDEV_BLOCK
The APIs scsi_host_block()/scsi_host_unblock() were recently added by
commit 2bb955840c1d ("scsi: core: add scsi_host_(block,unblock) helper
function") and so far the APIs are only used by: commit 3d3ca53b1639
("scsi: aacraid: use scsi_host_(block,unblock) to block I/O").
However, from reading the code, I think the APIs don't really work for
aacraid, because, in the resume path of hibernation, when aac_suspend() ->
scsi_host_block() is called, scsi_device_quiesce() has set the state to
SDEV_QUIESCE, so aac_suspend() -> scsi_host_block() returns -EINVAL.
Fix the issue by allowing the state change.
Link: https://lore.kernel.org/r/1587170445-50013-1-git-send-email-decui@microsoft.com
Fixes: 2bb955840c1d ("scsi: core: add scsi_host_(block,unblock) helper function")
Reviewed-by: Ewan D. Milne <emilne@redhat.com>
Reviewed-by: Ming Lei <ming.lei@redhat.com>
Signed-off-by: Dexuan Cui <decui@microsoft.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-04-18 03:40:45 +03:00
case SDEV_QUIESCE :
2018-10-07 11:35:35 +03:00
case SDEV_OFFLINE :
2008-08-23 01:53:31 +04:00
break ;
default :
goto illegal ;
}
break ;
case SDEV_CREATED_BLOCK :
switch ( oldstate ) {
case SDEV_CREATED :
2005-04-17 02:20:36 +04:00
break ;
default :
goto illegal ;
}
break ;
case SDEV_CANCEL :
switch ( oldstate ) {
case SDEV_CREATED :
case SDEV_RUNNING :
2006-06-23 22:25:34 +04:00
case SDEV_QUIESCE :
2005-04-17 02:20:36 +04:00
case SDEV_OFFLINE :
2012-05-18 08:56:56 +04:00
case SDEV_TRANSPORT_OFFLINE :
2005-04-17 02:20:36 +04:00
break ;
default :
goto illegal ;
}
break ;
case SDEV_DEL :
switch ( oldstate ) {
[SCSI] scsi: Device scanning oops for offlined devices (resend)
If a device gets offlined as a result of the Inquiry sent
during scanning, the following oops can occur. After the
disk gets put into the SDEV_OFFLINE state, the error handler
sends back the failed inquiry, which wakes the thread doing
the scan. This starts a race between the scanning thread
freeing the scsi device and the error handler calling
scsi_run_host_queues to restart the host. Since the disk
is in the SDEV_OFFLINE state, scsi_device_get will still
work, which results in __scsi_iterate_devices getting
a reference to the scsi disk when it shouldn't.
The following execution thread causes the oops:
CPU 0 (scan) CPU 1 (eh)
---------------------------------------------------------
scsi_probe_and_add_lun
....
scsi_eh_offline_sdevs
scsi_eh_flush_done_q
scsi_destroy_sdev
scsi_device_dev_release
scsi_restart_operations
scsi_run_host_queues
__scsi_iterate_devices
get_device
scsi_device_dev_release_usercontext
scsi_run_queue
<---OOPS--->
The patch fixes this by changing the state of the sdev to SDEV_DEL
before doing the final put_device, which should prevent the race
from occurring.
Original oops follows:
Badness in kref_get at lib/kref.c:32
Call Trace:
[C00000002F4476D0] [C00000000000EE20] .show_stack+0x68/0x1b0 (unreliable)
[C00000002F447770] [C00000000037515C] .program_check_exception+0x1cc/0x5a8
[C00000002F447840] [C00000000000446C] program_check_common+0xec/0x100
Exception: 700 at .kref_get+0x10/0x28
LR = .kobject_get+0x20/0x3c
[C00000002F447B30] [C00000002F447BC0] 0xc00000002f447bc0 (unreliable)
[C00000002F447BB0] [C000000000254BDC] .get_device+0x20/0x3c
[C00000002F447C30] [D000000000063188] .scsi_device_get+0x34/0xdc [scsi_mod]
[C00000002F447CC0] [D0000000000633EC] .__scsi_iterate_devices+0x50/0xbc [scsi_mod]
[C00000002F447D60] [D00000000006A910] .scsi_run_host_queues+0x34/0x5c [scsi_mod]
[C00000002F447DF0] [D000000000069054] .scsi_error_handler+0xdb4/0xe44 [scsi_mod]
[C00000002F447EE0] [C00000000007B4E0] .kthread+0x128/0x178
[C00000002F447F90] [C000000000025E84] .kernel_thread+0x4c/0x68
Unable to handle kernel paging request for <7>PCI: Enabling device: (0002:41:01.1), cmd 143
data at address 0x000001b8
Faulting instruction address: 0xd0000000000698e4
sym1: <1010-66> rev 0x1 at pci 0002:41:01.1 irq 216
sym1: No NVRAM, ID 7, Fast-80, LVD, parity checking
sym1: SCSI BUS has been reset.
scsi2 : sym-2.2.2
cpu 0x0: Vector: 300 (Data Access) at [c00000002f447a30]
pc: d0000000000698e4: .scsi_run_queue+0x2c/0x218 [scsi_mod]
lr: d00000000006a904: .scsi_run_host_queues+0x28/0x5c [scsi_mod]
sp: c00000002f447cb0
msr: 9000000000009032
dar: 1b8
dsisr: 40000000
current = 0xc0000000045fecd0
paca = 0xc00000000048ee80
pid = 1123, comm = scsi_eh_1
enter ? for help
[c00000002f447d60] d00000000006a904 .scsi_run_host_queues+0x28/0x5c [scsi_mod]
[c00000002f447df0] d000000000069054 .scsi_error_handler+0xdb4/0xe44 [scsi_mod]
[c00000002f447ee0] c00000000007b4e0 .kthread+0x128/0x178
[c00000002f447f90] c000000000025e84 .kernel_thread+0x4c/0x68
Signed-off-by: Brian King <brking@us.ibm.com>
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-06-27 20:10:43 +04:00
case SDEV_CREATED :
case SDEV_RUNNING :
case SDEV_OFFLINE :
2012-05-18 08:56:56 +04:00
case SDEV_TRANSPORT_OFFLINE :
2005-04-17 02:20:36 +04:00
case SDEV_CANCEL :
2017-06-03 00:21:57 +03:00
case SDEV_BLOCK :
2013-07-02 17:06:33 +04:00
case SDEV_CREATED_BLOCK :
2005-04-17 02:20:36 +04:00
break ;
default :
goto illegal ;
}
break ;
}
2020-03-11 17:39:30 +03:00
sdev - > offline_already = false ;
2005-04-17 02:20:36 +04:00
sdev - > sdev_state = state ;
return 0 ;
illegal :
2014-06-25 18:39:59 +04:00
SCSI_LOG_ERROR_RECOVERY ( 1 ,
2005-10-02 20:45:08 +04:00
sdev_printk ( KERN_ERR , sdev ,
2014-06-25 18:39:59 +04:00
" Illegal state transition %s->%s " ,
2005-10-02 20:45:08 +04:00
scsi_device_state_name ( oldstate ) ,
scsi_device_state_name ( state ) )
2005-04-17 02:20:36 +04:00
) ;
return - EINVAL ;
}
EXPORT_SYMBOL ( scsi_device_set_state ) ;
2007-10-30 00:15:22 +03:00
/**
2020-10-23 19:33:14 +03:00
* scsi_evt_emit - emit a single SCSI device uevent
2007-10-30 00:15:22 +03:00
* @ sdev : associated SCSI device
* @ evt : event to emit
*
* Send a single uevent ( scsi_event ) to the associated scsi_device .
*/
static void scsi_evt_emit ( struct scsi_device * sdev , struct scsi_event * evt )
{
int idx = 0 ;
char * envp [ 3 ] ;
switch ( evt - > evt_type ) {
case SDEV_EVT_MEDIA_CHANGE :
envp [ idx + + ] = " SDEV_MEDIA_CHANGE=1 " ;
break ;
2013-08-08 23:07:48 +04:00
case SDEV_EVT_INQUIRY_CHANGE_REPORTED :
2016-02-19 11:17:16 +03:00
scsi_rescan_device ( & sdev - > sdev_gendev ) ;
2013-08-08 23:07:48 +04:00
envp [ idx + + ] = " SDEV_UA=INQUIRY_DATA_HAS_CHANGED " ;
break ;
case SDEV_EVT_CAPACITY_CHANGE_REPORTED :
envp [ idx + + ] = " SDEV_UA=CAPACITY_DATA_HAS_CHANGED " ;
break ;
case SDEV_EVT_SOFT_THRESHOLD_REACHED_REPORTED :
envp [ idx + + ] = " SDEV_UA=THIN_PROVISIONING_SOFT_THRESHOLD_REACHED " ;
break ;
case SDEV_EVT_MODE_PARAMETER_CHANGE_REPORTED :
envp [ idx + + ] = " SDEV_UA=MODE_PARAMETERS_CHANGED " ;
break ;
case SDEV_EVT_LUN_CHANGE_REPORTED :
envp [ idx + + ] = " SDEV_UA=REPORTED_LUNS_DATA_HAS_CHANGED " ;
break ;
2015-07-06 14:41:53 +03:00
case SDEV_EVT_ALUA_STATE_CHANGE_REPORTED :
envp [ idx + + ] = " SDEV_UA=ASYMMETRIC_ACCESS_STATE_CHANGED " ;
break ;
2017-10-17 10:11:24 +03:00
case SDEV_EVT_POWER_ON_RESET_OCCURRED :
envp [ idx + + ] = " SDEV_UA=POWER_ON_RESET_OCCURRED " ;
break ;
2007-10-30 00:15:22 +03:00
default :
/* do nothing */
break ;
}
envp [ idx + + ] = NULL ;
kobject_uevent_env ( & sdev - > sdev_gendev . kobj , KOBJ_CHANGE , envp ) ;
}
/**
2020-10-23 19:33:14 +03:00
* scsi_evt_thread - send a uevent for each scsi event
2007-10-30 00:15:22 +03:00
* @ work : work struct for scsi_device
*
* Dispatch queued events to their associated scsi_device kobjects
* as uevents .
*/
void scsi_evt_thread ( struct work_struct * work )
{
struct scsi_device * sdev ;
2013-08-08 23:07:48 +04:00
enum scsi_device_event evt_type ;
2007-10-30 00:15:22 +03:00
LIST_HEAD ( event_list ) ;
sdev = container_of ( work , struct scsi_device , event_work ) ;
2013-08-08 23:07:48 +04:00
for ( evt_type = SDEV_EVT_FIRST ; evt_type < = SDEV_EVT_LAST ; evt_type + + )
if ( test_and_clear_bit ( evt_type , sdev - > pending_events ) )
sdev_evt_send_simple ( sdev , evt_type , GFP_KERNEL ) ;
2007-10-30 00:15:22 +03:00
while ( 1 ) {
struct scsi_event * evt ;
struct list_head * this , * tmp ;
unsigned long flags ;
spin_lock_irqsave ( & sdev - > list_lock , flags ) ;
list_splice_init ( & sdev - > event_list , & event_list ) ;
spin_unlock_irqrestore ( & sdev - > list_lock , flags ) ;
if ( list_empty ( & event_list ) )
break ;
list_for_each_safe ( this , tmp , & event_list ) {
evt = list_entry ( this , struct scsi_event , node ) ;
list_del ( & evt - > node ) ;
scsi_evt_emit ( sdev , evt ) ;
kfree ( evt ) ;
}
}
}
/**
* sdev_evt_send - send asserted event to uevent thread
* @ sdev : scsi_device event occurred on
* @ evt : event to send
*
* Assert scsi device event asynchronously .
*/
void sdev_evt_send ( struct scsi_device * sdev , struct scsi_event * evt )
{
unsigned long flags ;
2008-03-19 15:04:47 +03:00
#if 0
/* FIXME: currently this check eliminates all media change events
* for polled devices . Need to update to discriminate between AN
* and polled events */
2007-10-30 00:15:22 +03:00
if ( ! test_bit ( evt - > evt_type , sdev - > supported_events ) ) {
kfree ( evt ) ;
return ;
}
2008-03-19 15:04:47 +03:00
# endif
2007-10-30 00:15:22 +03:00
spin_lock_irqsave ( & sdev - > list_lock , flags ) ;
list_add_tail ( & evt - > node , & sdev - > event_list ) ;
schedule_work ( & sdev - > event_work ) ;
spin_unlock_irqrestore ( & sdev - > list_lock , flags ) ;
}
EXPORT_SYMBOL_GPL ( sdev_evt_send ) ;
/**
* sdev_evt_alloc - allocate a new scsi event
* @ evt_type : type of event to allocate
* @ gfpflags : GFP flags for allocation
*
* Allocates and returns a new scsi_event .
*/
struct scsi_event * sdev_evt_alloc ( enum scsi_device_event evt_type ,
gfp_t gfpflags )
{
struct scsi_event * evt = kzalloc ( sizeof ( struct scsi_event ) , gfpflags ) ;
if ( ! evt )
return NULL ;
evt - > evt_type = evt_type ;
INIT_LIST_HEAD ( & evt - > node ) ;
/* evt_type-specific initialization, if any */
switch ( evt_type ) {
case SDEV_EVT_MEDIA_CHANGE :
2013-08-08 23:07:48 +04:00
case SDEV_EVT_INQUIRY_CHANGE_REPORTED :
case SDEV_EVT_CAPACITY_CHANGE_REPORTED :
case SDEV_EVT_SOFT_THRESHOLD_REACHED_REPORTED :
case SDEV_EVT_MODE_PARAMETER_CHANGE_REPORTED :
case SDEV_EVT_LUN_CHANGE_REPORTED :
2015-07-06 14:41:53 +03:00
case SDEV_EVT_ALUA_STATE_CHANGE_REPORTED :
2017-10-17 10:11:24 +03:00
case SDEV_EVT_POWER_ON_RESET_OCCURRED :
2007-10-30 00:15:22 +03:00
default :
/* do nothing */
break ;
}
return evt ;
}
EXPORT_SYMBOL_GPL ( sdev_evt_alloc ) ;
/**
* sdev_evt_send_simple - send asserted event to uevent thread
* @ sdev : scsi_device event occurred on
* @ evt_type : type of event to send
* @ gfpflags : GFP flags for allocation
*
* Assert scsi device event asynchronously , given an event type .
*/
void sdev_evt_send_simple ( struct scsi_device * sdev ,
enum scsi_device_event evt_type , gfp_t gfpflags )
{
struct scsi_event * evt = sdev_evt_alloc ( evt_type , gfpflags ) ;
if ( ! evt ) {
sdev_printk ( KERN_ERR , sdev , " event %d eaten due to OOM \n " ,
evt_type ) ;
return ;
}
sdev_evt_send ( sdev , evt ) ;
}
EXPORT_SYMBOL_GPL ( sdev_evt_send_simple ) ;
2005-04-17 02:20:36 +04:00
/**
2020-12-09 08:29:49 +03:00
* scsi_device_quiesce - Block all commands except power management .
2005-04-17 02:20:36 +04:00
* @ sdev : scsi device to quiesce .
*
* This works by trying to transition to the SDEV_QUIESCE state
* ( which must be a legal transition ) . When the device is in this
2020-12-09 08:29:49 +03:00
* state , only power management requests will be accepted , all others will
* be deferred .
2005-04-17 02:20:36 +04:00
*
* Must be called with user context , may sleep .
*
* Returns zero if unsuccessful or an error if not .
2007-11-03 21:30:39 +03:00
*/
2005-04-17 02:20:36 +04:00
int
scsi_device_quiesce ( struct scsi_device * sdev )
{
2017-11-09 21:49:58 +03:00
struct request_queue * q = sdev - > request_queue ;
2017-06-03 00:21:55 +03:00
int err ;
2017-11-09 21:49:58 +03:00
/*
* It is allowed to call scsi_device_quiesce ( ) multiple times from
* the same context but concurrent scsi_device_quiesce ( ) calls are
* not allowed .
*/
WARN_ON_ONCE ( sdev - > quiesced_by & & sdev - > quiesced_by ! = current ) ;
2018-09-27 00:01:04 +03:00
if ( sdev - > quiesced_by = = current )
return 0 ;
blk_set_pm_only ( q ) ;
2017-11-09 21:49:58 +03:00
blk_mq_freeze_queue ( q ) ;
/*
2018-09-27 00:01:04 +03:00
* Ensure that the effect of blk_set_pm_only ( ) will be visible
2017-11-09 21:49:58 +03:00
* for percpu_ref_tryget ( ) callers that occur after the queue
* unfreeze even if the queue was already frozen before this function
* was called . See also https : //lwn.net/Articles/573497/.
*/
synchronize_rcu ( ) ;
blk_mq_unfreeze_queue ( q ) ;
2017-06-03 00:21:55 +03:00
mutex_lock ( & sdev - > state_mutex ) ;
err = scsi_device_set_state ( sdev , SDEV_QUIESCE ) ;
2017-11-09 21:49:58 +03:00
if ( err = = 0 )
sdev - > quiesced_by = current ;
else
2018-09-27 00:01:04 +03:00
blk_clear_pm_only ( q ) ;
2017-06-03 00:21:55 +03:00
mutex_unlock ( & sdev - > state_mutex ) ;
2017-11-09 21:49:58 +03:00
return err ;
2005-04-17 02:20:36 +04:00
}
EXPORT_SYMBOL ( scsi_device_quiesce ) ;
/**
* scsi_device_resume - Restart user issued commands to a quiesced device .
* @ sdev : scsi device to resume .
*
* Moves the device from quiesced back to running and restarts the
* queues .
*
* Must be called with user context , may sleep .
2007-11-03 21:30:39 +03:00
*/
2012-03-23 04:05:11 +04:00
void scsi_device_resume ( struct scsi_device * sdev )
2005-04-17 02:20:36 +04:00
{
2012-03-23 04:05:11 +04:00
/* check if the device state was mutated prior to resume, and if
* so assume the state is being managed elsewhere ( for example
* device deleted during suspend )
*/
2017-06-03 00:21:55 +03:00
mutex_lock ( & sdev - > state_mutex ) ;
2020-12-09 08:29:49 +03:00
if ( sdev - > sdev_state = = SDEV_QUIESCE )
scsi_device_set_state ( sdev , SDEV_RUNNING ) ;
2019-03-16 02:27:58 +03:00
if ( sdev - > quiesced_by ) {
sdev - > quiesced_by = NULL ;
blk_clear_pm_only ( sdev - > request_queue ) ;
}
2017-06-03 00:21:55 +03:00
mutex_unlock ( & sdev - > state_mutex ) ;
2005-04-17 02:20:36 +04:00
}
EXPORT_SYMBOL ( scsi_device_resume ) ;
static void
device_quiesce_fn ( struct scsi_device * sdev , void * data )
{
scsi_device_quiesce ( sdev ) ;
}
void
scsi_target_quiesce ( struct scsi_target * starget )
{
starget_for_each_device ( starget , NULL , device_quiesce_fn ) ;
}
EXPORT_SYMBOL ( scsi_target_quiesce ) ;
static void
device_resume_fn ( struct scsi_device * sdev , void * data )
{
scsi_device_resume ( sdev ) ;
}
void
scsi_target_resume ( struct scsi_target * starget )
{
starget_for_each_device ( starget , NULL , device_resume_fn ) ;
}
EXPORT_SYMBOL ( scsi_target_resume ) ;
2021-11-09 10:11:42 +03:00
static int __scsi_internal_device_block_nowait ( struct scsi_device * sdev )
{
if ( scsi_device_set_state ( sdev , SDEV_BLOCK ) )
return scsi_device_set_state ( sdev , SDEV_CREATED_BLOCK ) ;
return 0 ;
}
2021-11-09 10:11:43 +03:00
void scsi_start_queue ( struct scsi_device * sdev )
{
if ( cmpxchg ( & sdev - > queue_stopped , 1 , 0 ) )
blk_mq_unquiesce_queue ( sdev - > request_queue ) ;
}
static void scsi_stop_queue ( struct scsi_device * sdev , bool nowait )
{
/*
* The atomic variable of - > queue_stopped covers that
* blk_mq_quiesce_queue * is balanced with blk_mq_unquiesce_queue .
*
* However , we still need to wait until quiesce is done
* in case that queue has been stopped .
*/
if ( ! cmpxchg ( & sdev - > queue_stopped , 0 , 1 ) ) {
if ( nowait )
blk_mq_quiesce_queue_nowait ( sdev - > request_queue ) ;
else
blk_mq_quiesce_queue ( sdev - > request_queue ) ;
} else {
if ( ! nowait )
blk_mq_wait_quiesce_done ( sdev - > request_queue ) ;
}
}
2005-04-17 02:20:36 +04:00
/**
2017-06-03 00:21:53 +03:00
* scsi_internal_device_block_nowait - try to transition to the SDEV_BLOCK state
* @ sdev : device to block
2005-04-17 02:20:36 +04:00
*
2017-06-03 00:21:53 +03:00
* Pause SCSI command processing on the specified device . Does not sleep .
2005-04-17 02:20:36 +04:00
*
2017-06-03 00:21:53 +03:00
* Returns zero if successful or a negative error code upon failure .
2016-11-23 03:17:13 +03:00
*
2017-06-03 00:21:53 +03:00
* Notes :
* This routine transitions the device to the SDEV_BLOCK state ( which must be
* a legal transition ) . When the device is in this state , command processing
* is paused until the device leaves the SDEV_BLOCK state . See also
* scsi_internal_device_unblock_nowait ( ) .
2007-11-03 21:30:39 +03:00
*/
2017-06-03 00:21:53 +03:00
int scsi_internal_device_block_nowait ( struct scsi_device * sdev )
2005-04-17 02:20:36 +04:00
{
2021-11-09 10:11:42 +03:00
int ret = __scsi_internal_device_block_nowait ( sdev ) ;
2005-04-17 02:20:36 +04:00
2020-06-19 18:41:17 +03:00
/*
2005-04-17 02:20:36 +04:00
* The device has transitioned to SDEV_BLOCK . Stop the
* block layer from calling the midlayer with this device ' s
2020-06-19 18:41:17 +03:00
* request queue .
2005-04-17 02:20:36 +04:00
*/
2021-11-09 10:11:42 +03:00
if ( ! ret )
2021-11-09 10:11:43 +03:00
scsi_stop_queue ( sdev , true ) ;
2021-11-09 10:11:42 +03:00
return ret ;
2005-04-17 02:20:36 +04:00
}
2017-06-03 00:21:53 +03:00
EXPORT_SYMBOL_GPL ( scsi_internal_device_block_nowait ) ;
2005-04-17 02:20:36 +04:00
/**
2017-06-03 00:21:53 +03:00
* scsi_internal_device_block - try to transition to the SDEV_BLOCK state
* @ sdev : device to block
*
* Pause SCSI command processing on the specified device and wait until all
* ongoing scsi_request_fn ( ) / scsi_queue_rq ( ) calls have finished . May sleep .
2005-04-17 02:20:36 +04:00
*
2017-06-03 00:21:53 +03:00
* Returns zero if successful or a negative error code upon failure .
2005-04-17 02:20:36 +04:00
*
2017-06-03 00:21:53 +03:00
* Note :
* This routine transitions the device to the SDEV_BLOCK state ( which must be
* a legal transition ) . When the device is in this state , command processing
* is paused until the device leaves the SDEV_BLOCK state . See also
* scsi_internal_device_unblock ( ) .
2007-11-03 21:30:39 +03:00
*/
2017-06-03 00:21:53 +03:00
static int scsi_internal_device_block ( struct scsi_device * sdev )
2005-04-17 02:20:36 +04:00
{
2017-06-03 00:21:53 +03:00
int err ;
2017-06-03 00:21:55 +03:00
mutex_lock ( & sdev - > state_mutex ) ;
2021-11-09 10:11:42 +03:00
err = __scsi_internal_device_block_nowait ( sdev ) ;
2018-11-02 01:36:27 +03:00
if ( err = = 0 )
2021-11-09 10:11:43 +03:00
scsi_stop_queue ( sdev , false ) ;
2017-06-03 00:21:55 +03:00
mutex_unlock ( & sdev - > state_mutex ) ;
2017-06-03 00:21:53 +03:00
return err ;
}
2020-06-19 18:41:17 +03:00
2005-04-17 02:20:36 +04:00
/**
2017-06-03 00:21:54 +03:00
* scsi_internal_device_unblock_nowait - resume a device after a block request
2005-04-17 02:20:36 +04:00
* @ sdev : device to resume
2017-06-03 00:21:54 +03:00
* @ new_state : state to set the device to after unblocking
2005-04-17 02:20:36 +04:00
*
2017-06-03 00:21:54 +03:00
* Restart the device queue for a previously suspended SCSI device . Does not
* sleep .
2005-04-17 02:20:36 +04:00
*
2017-06-03 00:21:54 +03:00
* Returns zero if successful or a negative error code upon failure .
2005-04-17 02:20:36 +04:00
*
2017-06-03 00:21:54 +03:00
* Notes :
* This routine transitions the device to the SDEV_RUNNING state or to one of
* the offline states ( which must be a legal transition ) allowing the midlayer
* to goose the queue for this device .
2007-11-03 21:30:39 +03:00
*/
2017-06-03 00:21:54 +03:00
int scsi_internal_device_unblock_nowait ( struct scsi_device * sdev ,
enum scsi_device_state new_state )
2005-04-17 02:20:36 +04:00
{
2019-08-02 01:38:12 +03:00
switch ( new_state ) {
case SDEV_RUNNING :
case SDEV_TRANSPORT_OFFLINE :
break ;
default :
return - EINVAL ;
}
2012-05-18 08:56:57 +04:00
/*
* Try to transition the scsi device to SDEV_RUNNING or one of the
* offlined states and goose the device queue if successful .
2005-04-17 02:20:36 +04:00
*/
2017-08-11 09:53:46 +03:00
switch ( sdev - > sdev_state ) {
case SDEV_BLOCK :
case SDEV_TRANSPORT_OFFLINE :
2012-05-18 08:56:57 +04:00
sdev - > sdev_state = new_state ;
2017-08-11 09:53:46 +03:00
break ;
case SDEV_CREATED_BLOCK :
2012-05-18 08:56:57 +04:00
if ( new_state = = SDEV_TRANSPORT_OFFLINE | |
new_state = = SDEV_OFFLINE )
sdev - > sdev_state = new_state ;
else
sdev - > sdev_state = SDEV_CREATED ;
2017-08-11 09:53:46 +03:00
break ;
case SDEV_CANCEL :
case SDEV_OFFLINE :
break ;
default :
2009-04-29 20:13:02 +04:00
return - EINVAL ;
2017-08-11 09:53:46 +03:00
}
2017-06-03 00:21:56 +03:00
scsi_start_queue ( sdev ) ;
2005-04-17 02:20:36 +04:00
return 0 ;
}
2017-06-03 00:21:54 +03:00
EXPORT_SYMBOL_GPL ( scsi_internal_device_unblock_nowait ) ;
/**
* scsi_internal_device_unblock - resume a device after a block request
* @ sdev : device to resume
* @ new_state : state to set the device to after unblocking
*
* Restart the device queue for a previously suspended SCSI device . May sleep .
*
* Returns zero if successful or a negative error code upon failure .
*
* Notes :
* This routine transitions the device to the SDEV_RUNNING state or to one of
* the offline states ( which must be a legal transition ) allowing the midlayer
* to goose the queue for this device .
*/
static int scsi_internal_device_unblock ( struct scsi_device * sdev ,
enum scsi_device_state new_state )
{
2017-06-03 00:21:55 +03:00
int ret ;
mutex_lock ( & sdev - > state_mutex ) ;
ret = scsi_internal_device_unblock_nowait ( sdev , new_state ) ;
mutex_unlock ( & sdev - > state_mutex ) ;
return ret ;
2017-06-03 00:21:54 +03:00
}
2005-04-17 02:20:36 +04:00
static void
device_block ( struct scsi_device * sdev , void * data )
{
2019-08-02 01:38:13 +03:00
int ret ;
ret = scsi_internal_device_block ( sdev ) ;
WARN_ONCE ( ret , " scsi_internal_device_block(%s) failed: ret = %d \n " ,
dev_name ( & sdev - > sdev_gendev ) , ret ) ;
2005-04-17 02:20:36 +04:00
}
static int
target_block ( struct device * dev , void * data )
{
if ( scsi_is_target_device ( dev ) )
starget_for_each_device ( to_scsi_target ( dev ) , NULL ,
device_block ) ;
return 0 ;
}
void
scsi_target_block ( struct device * dev )
{
if ( scsi_is_target_device ( dev ) )
starget_for_each_device ( to_scsi_target ( dev ) , NULL ,
device_block ) ;
else
device_for_each_child ( dev , NULL , target_block ) ;
}
EXPORT_SYMBOL_GPL ( scsi_target_block ) ;
static void
device_unblock ( struct scsi_device * sdev , void * data )
{
2012-05-18 08:56:57 +04:00
scsi_internal_device_unblock ( sdev , * ( enum scsi_device_state * ) data ) ;
2005-04-17 02:20:36 +04:00
}
static int
target_unblock ( struct device * dev , void * data )
{
if ( scsi_is_target_device ( dev ) )
2012-05-18 08:56:57 +04:00
starget_for_each_device ( to_scsi_target ( dev ) , data ,
2005-04-17 02:20:36 +04:00
device_unblock ) ;
return 0 ;
}
void
2012-05-18 08:56:57 +04:00
scsi_target_unblock ( struct device * dev , enum scsi_device_state new_state )
2005-04-17 02:20:36 +04:00
{
if ( scsi_is_target_device ( dev ) )
2012-05-18 08:56:57 +04:00
starget_for_each_device ( to_scsi_target ( dev ) , & new_state ,
2005-04-17 02:20:36 +04:00
device_unblock ) ;
else
2012-05-18 08:56:57 +04:00
device_for_each_child ( dev , & new_state , target_unblock ) ;
2005-04-17 02:20:36 +04:00
}
EXPORT_SYMBOL_GPL ( scsi_target_unblock ) ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
2020-02-28 10:53:13 +03:00
int
scsi_host_block ( struct Scsi_Host * shost )
{
struct scsi_device * sdev ;
int ret = 0 ;
2020-04-23 05:07:13 +03:00
/*
* Call scsi_internal_device_block_nowait so we can avoid
* calling synchronize_rcu ( ) for each LUN .
*/
2020-02-28 10:53:13 +03:00
shost_for_each_device ( sdev , shost ) {
2020-04-23 05:07:13 +03:00
mutex_lock ( & sdev - > state_mutex ) ;
ret = scsi_internal_device_block_nowait ( sdev ) ;
mutex_unlock ( & sdev - > state_mutex ) ;
2020-07-17 12:09:20 +03:00
if ( ret ) {
scsi_device_put ( sdev ) ;
2020-02-28 10:53:13 +03:00
break ;
2020-07-17 12:09:20 +03:00
}
2020-02-28 10:53:13 +03:00
}
2020-04-23 05:07:13 +03:00
/*
* SCSI never enables blk - mq ' s BLK_MQ_F_BLOCKING flag so
* calling synchronize_rcu ( ) once is enough .
*/
WARN_ON_ONCE ( shost - > tag_set . flags & BLK_MQ_F_BLOCKING ) ;
if ( ! ret )
synchronize_rcu ( ) ;
2020-02-28 10:53:13 +03:00
return ret ;
}
EXPORT_SYMBOL_GPL ( scsi_host_block ) ;
int
scsi_host_unblock ( struct Scsi_Host * shost , int new_state )
{
struct scsi_device * sdev ;
int ret = 0 ;
shost_for_each_device ( sdev , shost ) {
ret = scsi_internal_device_unblock ( sdev , new_state ) ;
2020-05-18 10:44:20 +03:00
if ( ret ) {
scsi_device_put ( sdev ) ;
2020-02-28 10:53:13 +03:00
break ;
2020-05-18 10:44:20 +03:00
}
2020-02-28 10:53:13 +03:00
}
return ret ;
}
EXPORT_SYMBOL_GPL ( scsi_host_unblock ) ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
/**
* scsi_kmap_atomic_sg - find and atomically map an sg - elemnt
2007-11-03 21:30:39 +03:00
* @ sgl : scatter - gather list
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
* @ sg_count : number of segments in sg
* @ offset : offset in bytes into sg , on return offset into the mapped area
* @ len : bytes to map , on return number of bytes mapped
*
* Returns virtual address of the start of the mapped page
*/
2007-10-16 13:08:49 +04:00
void * scsi_kmap_atomic_sg ( struct scatterlist * sgl , int sg_count ,
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
size_t * offset , size_t * len )
{
int i ;
size_t sg_len = 0 , len_complete = 0 ;
2007-10-16 13:08:49 +04:00
struct scatterlist * sg ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
struct page * page ;
2007-02-06 03:39:03 +03:00
WARN_ON ( ! irqs_disabled ( ) ) ;
2007-10-16 13:08:49 +04:00
for_each_sg ( sgl , sg , sg_count , i ) {
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
len_complete = sg_len ; /* Complete sg-entries */
2007-10-16 13:08:49 +04:00
sg_len + = sg - > length ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
if ( sg_len > * offset )
break ;
}
if ( unlikely ( i = = sg_count ) ) {
2006-04-19 08:09:08 +04:00
printk ( KERN_ERR " %s: Bytes in sg: %zu, requested offset %zu, "
" elements %d \n " ,
2008-07-04 10:47:27 +04:00
__func__ , sg_len , * offset , sg_count ) ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
WARN_ON ( 1 ) ;
return NULL ;
}
/* Offset starting from the beginning of first page in this sg-entry */
2007-10-16 13:08:49 +04:00
* offset = * offset - len_complete + sg - > offset ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
/* Assumption: contiguous pages can be accessed as "page + i" */
2007-10-22 23:19:53 +04:00
page = nth_page ( sg_page ( sg ) , ( * offset > > PAGE_SHIFT ) ) ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
* offset & = ~ PAGE_MASK ;
/* Bytes in this sg-entry from *offset to the end of the page */
sg_len = PAGE_SIZE - * offset ;
if ( * len > sg_len )
* len = sg_len ;
2011-11-25 19:14:23 +04:00
return kmap_atomic ( page ) ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
}
EXPORT_SYMBOL ( scsi_kmap_atomic_sg ) ;
/**
2007-11-03 21:30:39 +03:00
* scsi_kunmap_atomic_sg - atomically unmap a virtual address , previously mapped with scsi_kmap_atomic_sg
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
* @ virt : virtual address to be unmapped
*/
void scsi_kunmap_atomic_sg ( void * virt )
{
2011-11-25 19:14:23 +04:00
kunmap_atomic ( virt ) ;
[SCSI] dc395x: dynamically map scatter-gather for PIO
The current dc395x driver uses PIO to transfer up to 4 bytes which do not
get transferred by DMA (under unclear circumstances). For this the driver
uses page_address() which is broken on highmem. Apart from this the
actual calculation of the virtual address is wrong (even without highmem).
So, e.g., for reading it reads bytes from the driver to a wrong address
and returns wrong data, I guess, for writing it would just output random
data to the device.
The proper fix, as suggested by many, is to dynamically map data using
kmap_atomic(page, KM_BIO_SRC_IRQ) / kunmap_atomic(virt). The reason why it
has not been done until now, although I've done some preliminary patches
more than a year ago was that nobody interested in fixing this problem was
able to reliably reproduce it. Now it changed - with the help from
Sebastian Frei (CC'ed) I was able to trigger the PIO path. Thus, I was
also able to test and debug it.
There are 4 cases when PIO is used in dc395x - data-in / -out with and
without scatter-gather. I was able to reproduce and test only data-in with
and without SG. So, the data-out path is still untested, but it is also
somewhat simpler than the data-in. Fredrik Roubert (also CC'ed) also had
PIO triggering on his system, and in his case it was data-out without SG.
It would be great if he could test the attached patch on his system, but
even if he cannot, I would still request to apply the patch and just wait
if anybody cries...
Implementation: I put 2 new functions in scsi_lib.c and their declarations
in scsi_cmnd.h. I exported them without _GPL, although, I don't feel
strongly about that - not many drivers are likely to use them. But there
is at least one more - I want to use them in tmscsim.c. Whether these are
the right files for the functions and their declarations - not sure
either. Actually, they are not scsi-specific, so, might go somewhere
around other scattergather magic? They are not platform specific either,
and most SG functions are defined under arch/*/... As these issues were
discussed previously there were some more routines suggested to manipulate
scattergather buffers, I think, some of them were needed around
crypto code... So, might be a common place reasonable, like
lib/scattergather.c? I am open here.
Signed-off-by: James Bottomley <James.Bottomley@SteelEye.com>
2006-04-02 23:57:43 +04:00
}
EXPORT_SYMBOL ( scsi_kunmap_atomic_sg ) ;
2013-01-23 11:09:32 +04:00
void sdev_disable_disk_events ( struct scsi_device * sdev )
{
atomic_inc ( & sdev - > disk_events_disable_depth ) ;
}
EXPORT_SYMBOL ( sdev_disable_disk_events ) ;
void sdev_enable_disk_events ( struct scsi_device * sdev )
{
if ( WARN_ON_ONCE ( atomic_read ( & sdev - > disk_events_disable_depth ) < = 0 ) )
return ;
atomic_dec ( & sdev - > disk_events_disable_depth ) ;
}
EXPORT_SYMBOL ( sdev_enable_disk_events ) ;
2015-12-01 12:16:55 +03:00
scsi: core: Fix VPD LUN ID designator priorities
The current implementation of scsi_vpd_lun_id() uses the designator length
as an implicit measure of priority. This works most of the time, but not
always. For example, some Hitachi storage arrays return this in VPD 0x83:
VPD INQUIRY: Device Identification page
Designation descriptor number 1, descriptor length: 24
designator_type: T10 vendor identification, code_set: ASCII
associated with the Addressed logical unit
vendor id: HITACHI
vendor specific: 5030C3502025
Designation descriptor number 2, descriptor length: 6
designator_type: vendor specific [0x0], code_set: Binary
associated with the Target port
vendor specific: 08 03
Designation descriptor number 3, descriptor length: 20
designator_type: NAA, code_set: Binary
associated with the Addressed logical unit
NAA 6, IEEE Company_id: 0x60e8
Vendor Specific Identifier: 0x7c35000
Vendor Specific Identifier Extension: 0x30c35000002025
[0x60060e8007c350000030c35000002025]
The current code would use the first descriptor because it's longer than
the NAA descriptor. But this is wrong, the kernel is supposed to prefer NAA
descriptors over T10 vendor ID. Designator length should only be used to
compare designators of the same type.
This patch addresses the issue by separating designator priority and
length.
Link: https://lore.kernel.org/r/20201029170846.14786-1-mwilck@suse.com
Fixes: 9983bed3907c ("scsi: Add scsi_vpd_lun_id()")
Reviewed-by: Hannes Reinecke <hare@suse.de>
Signed-off-by: Martin Wilck <mwilck@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-10-29 20:08:45 +03:00
static unsigned char designator_prio ( const unsigned char * d )
{
if ( d [ 1 ] & 0x30 )
/* not associated with LUN */
return 0 ;
if ( d [ 3 ] = = 0 )
/* invalid length */
return 0 ;
/*
* Order of preference for lun descriptor :
* - SCSI name string
* - NAA IEEE Registered Extended
* - EUI - 64 based 16 - byte
* - EUI - 64 based 12 - byte
* - NAA IEEE Registered
* - NAA IEEE Extended
* - EUI - 64 based 8 - byte
* - SCSI name string ( truncated )
* - T10 Vendor ID
* as longer descriptors reduce the likelyhood
* of identification clashes .
*/
switch ( d [ 1 ] & 0xf ) {
case 8 :
/* SCSI name string, variable-length UTF-8 */
return 9 ;
case 3 :
switch ( d [ 4 ] > > 4 ) {
case 6 :
/* NAA registered extended */
return 8 ;
case 5 :
/* NAA registered */
return 5 ;
case 4 :
/* NAA extended */
return 4 ;
case 3 :
/* NAA locally assigned */
return 1 ;
default :
break ;
}
break ;
case 2 :
switch ( d [ 3 ] ) {
case 16 :
/* EUI64-based, 16 byte */
return 7 ;
case 12 :
/* EUI64-based, 12 byte */
return 6 ;
case 8 :
/* EUI64-based, 8 byte */
return 3 ;
default :
break ;
}
break ;
case 1 :
/* T10 vendor ID */
return 1 ;
default :
break ;
}
return 0 ;
}
2015-12-01 12:16:55 +03:00
/**
* scsi_vpd_lun_id - return a unique device identification
* @ sdev : SCSI device
* @ id : buffer for the identification
* @ id_len : length of the buffer
*
* Copies a unique device identification into @ id based
* on the information in the VPD page 0x83 of the device .
* The string will be formatted as a SCSI name string .
*
* Returns the length of the identification or error on failure .
* If the identifier is longer than the supplied buffer the actual
* identifier length is returned and the buffer is not zero - padded .
*/
int scsi_vpd_lun_id ( struct scsi_device * sdev , char * id , size_t id_len )
{
scsi: core: Fix VPD LUN ID designator priorities
The current implementation of scsi_vpd_lun_id() uses the designator length
as an implicit measure of priority. This works most of the time, but not
always. For example, some Hitachi storage arrays return this in VPD 0x83:
VPD INQUIRY: Device Identification page
Designation descriptor number 1, descriptor length: 24
designator_type: T10 vendor identification, code_set: ASCII
associated with the Addressed logical unit
vendor id: HITACHI
vendor specific: 5030C3502025
Designation descriptor number 2, descriptor length: 6
designator_type: vendor specific [0x0], code_set: Binary
associated with the Target port
vendor specific: 08 03
Designation descriptor number 3, descriptor length: 20
designator_type: NAA, code_set: Binary
associated with the Addressed logical unit
NAA 6, IEEE Company_id: 0x60e8
Vendor Specific Identifier: 0x7c35000
Vendor Specific Identifier Extension: 0x30c35000002025
[0x60060e8007c350000030c35000002025]
The current code would use the first descriptor because it's longer than
the NAA descriptor. But this is wrong, the kernel is supposed to prefer NAA
descriptors over T10 vendor ID. Designator length should only be used to
compare designators of the same type.
This patch addresses the issue by separating designator priority and
length.
Link: https://lore.kernel.org/r/20201029170846.14786-1-mwilck@suse.com
Fixes: 9983bed3907c ("scsi: Add scsi_vpd_lun_id()")
Reviewed-by: Hannes Reinecke <hare@suse.de>
Signed-off-by: Martin Wilck <mwilck@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-10-29 20:08:45 +03:00
u8 cur_id_prio = 0 ;
2015-12-01 12:16:55 +03:00
u8 cur_id_size = 0 ;
2017-08-29 18:50:13 +03:00
const unsigned char * d , * cur_id_str ;
const struct scsi_vpd * vpd_pg83 ;
2015-12-01 12:16:55 +03:00
int id_size = - EINVAL ;
rcu_read_lock ( ) ;
vpd_pg83 = rcu_dereference ( sdev - > vpd_pg83 ) ;
if ( ! vpd_pg83 ) {
rcu_read_unlock ( ) ;
return - ENXIO ;
}
/* The id string must be at least 20 bytes + terminating NULL byte */
if ( id_len < 21 ) {
rcu_read_unlock ( ) ;
return - EINVAL ;
}
memset ( id , 0 , id_len ) ;
2020-10-29 20:08:46 +03:00
for ( d = vpd_pg83 - > data + 4 ;
d < vpd_pg83 - > data + vpd_pg83 - > len ;
d + = d [ 3 ] + 4 ) {
scsi: core: Fix VPD LUN ID designator priorities
The current implementation of scsi_vpd_lun_id() uses the designator length
as an implicit measure of priority. This works most of the time, but not
always. For example, some Hitachi storage arrays return this in VPD 0x83:
VPD INQUIRY: Device Identification page
Designation descriptor number 1, descriptor length: 24
designator_type: T10 vendor identification, code_set: ASCII
associated with the Addressed logical unit
vendor id: HITACHI
vendor specific: 5030C3502025
Designation descriptor number 2, descriptor length: 6
designator_type: vendor specific [0x0], code_set: Binary
associated with the Target port
vendor specific: 08 03
Designation descriptor number 3, descriptor length: 20
designator_type: NAA, code_set: Binary
associated with the Addressed logical unit
NAA 6, IEEE Company_id: 0x60e8
Vendor Specific Identifier: 0x7c35000
Vendor Specific Identifier Extension: 0x30c35000002025
[0x60060e8007c350000030c35000002025]
The current code would use the first descriptor because it's longer than
the NAA descriptor. But this is wrong, the kernel is supposed to prefer NAA
descriptors over T10 vendor ID. Designator length should only be used to
compare designators of the same type.
This patch addresses the issue by separating designator priority and
length.
Link: https://lore.kernel.org/r/20201029170846.14786-1-mwilck@suse.com
Fixes: 9983bed3907c ("scsi: Add scsi_vpd_lun_id()")
Reviewed-by: Hannes Reinecke <hare@suse.de>
Signed-off-by: Martin Wilck <mwilck@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-10-29 20:08:45 +03:00
u8 prio = designator_prio ( d ) ;
if ( prio = = 0 | | cur_id_prio > prio )
2020-10-29 20:08:46 +03:00
continue ;
2015-12-01 12:16:55 +03:00
switch ( d [ 1 ] & 0xf ) {
2016-05-09 10:14:29 +03:00
case 0x1 :
/* T10 Vendor ID */
if ( cur_id_size > d [ 3 ] )
break ;
scsi: core: Fix VPD LUN ID designator priorities
The current implementation of scsi_vpd_lun_id() uses the designator length
as an implicit measure of priority. This works most of the time, but not
always. For example, some Hitachi storage arrays return this in VPD 0x83:
VPD INQUIRY: Device Identification page
Designation descriptor number 1, descriptor length: 24
designator_type: T10 vendor identification, code_set: ASCII
associated with the Addressed logical unit
vendor id: HITACHI
vendor specific: 5030C3502025
Designation descriptor number 2, descriptor length: 6
designator_type: vendor specific [0x0], code_set: Binary
associated with the Target port
vendor specific: 08 03
Designation descriptor number 3, descriptor length: 20
designator_type: NAA, code_set: Binary
associated with the Addressed logical unit
NAA 6, IEEE Company_id: 0x60e8
Vendor Specific Identifier: 0x7c35000
Vendor Specific Identifier Extension: 0x30c35000002025
[0x60060e8007c350000030c35000002025]
The current code would use the first descriptor because it's longer than
the NAA descriptor. But this is wrong, the kernel is supposed to prefer NAA
descriptors over T10 vendor ID. Designator length should only be used to
compare designators of the same type.
This patch addresses the issue by separating designator priority and
length.
Link: https://lore.kernel.org/r/20201029170846.14786-1-mwilck@suse.com
Fixes: 9983bed3907c ("scsi: Add scsi_vpd_lun_id()")
Reviewed-by: Hannes Reinecke <hare@suse.de>
Signed-off-by: Martin Wilck <mwilck@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-10-29 20:08:45 +03:00
cur_id_prio = prio ;
2016-05-09 10:14:29 +03:00
cur_id_size = d [ 3 ] ;
if ( cur_id_size + 4 > id_len )
cur_id_size = id_len - 4 ;
cur_id_str = d + 4 ;
id_size = snprintf ( id , id_len , " t10.%*pE " ,
cur_id_size , cur_id_str ) ;
break ;
2015-12-01 12:16:55 +03:00
case 0x2 :
/* EUI-64 */
scsi: core: Fix VPD LUN ID designator priorities
The current implementation of scsi_vpd_lun_id() uses the designator length
as an implicit measure of priority. This works most of the time, but not
always. For example, some Hitachi storage arrays return this in VPD 0x83:
VPD INQUIRY: Device Identification page
Designation descriptor number 1, descriptor length: 24
designator_type: T10 vendor identification, code_set: ASCII
associated with the Addressed logical unit
vendor id: HITACHI
vendor specific: 5030C3502025
Designation descriptor number 2, descriptor length: 6
designator_type: vendor specific [0x0], code_set: Binary
associated with the Target port
vendor specific: 08 03
Designation descriptor number 3, descriptor length: 20
designator_type: NAA, code_set: Binary
associated with the Addressed logical unit
NAA 6, IEEE Company_id: 0x60e8
Vendor Specific Identifier: 0x7c35000
Vendor Specific Identifier Extension: 0x30c35000002025
[0x60060e8007c350000030c35000002025]
The current code would use the first descriptor because it's longer than
the NAA descriptor. But this is wrong, the kernel is supposed to prefer NAA
descriptors over T10 vendor ID. Designator length should only be used to
compare designators of the same type.
This patch addresses the issue by separating designator priority and
length.
Link: https://lore.kernel.org/r/20201029170846.14786-1-mwilck@suse.com
Fixes: 9983bed3907c ("scsi: Add scsi_vpd_lun_id()")
Reviewed-by: Hannes Reinecke <hare@suse.de>
Signed-off-by: Martin Wilck <mwilck@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-10-29 20:08:45 +03:00
cur_id_prio = prio ;
2015-12-01 12:16:55 +03:00
cur_id_size = d [ 3 ] ;
cur_id_str = d + 4 ;
switch ( cur_id_size ) {
case 8 :
id_size = snprintf ( id , id_len ,
" eui.%8phN " ,
cur_id_str ) ;
break ;
case 12 :
id_size = snprintf ( id , id_len ,
" eui.%12phN " ,
cur_id_str ) ;
break ;
case 16 :
id_size = snprintf ( id , id_len ,
" eui.%16phN " ,
cur_id_str ) ;
break ;
default :
break ;
}
break ;
case 0x3 :
/* NAA */
scsi: core: Fix VPD LUN ID designator priorities
The current implementation of scsi_vpd_lun_id() uses the designator length
as an implicit measure of priority. This works most of the time, but not
always. For example, some Hitachi storage arrays return this in VPD 0x83:
VPD INQUIRY: Device Identification page
Designation descriptor number 1, descriptor length: 24
designator_type: T10 vendor identification, code_set: ASCII
associated with the Addressed logical unit
vendor id: HITACHI
vendor specific: 5030C3502025
Designation descriptor number 2, descriptor length: 6
designator_type: vendor specific [0x0], code_set: Binary
associated with the Target port
vendor specific: 08 03
Designation descriptor number 3, descriptor length: 20
designator_type: NAA, code_set: Binary
associated with the Addressed logical unit
NAA 6, IEEE Company_id: 0x60e8
Vendor Specific Identifier: 0x7c35000
Vendor Specific Identifier Extension: 0x30c35000002025
[0x60060e8007c350000030c35000002025]
The current code would use the first descriptor because it's longer than
the NAA descriptor. But this is wrong, the kernel is supposed to prefer NAA
descriptors over T10 vendor ID. Designator length should only be used to
compare designators of the same type.
This patch addresses the issue by separating designator priority and
length.
Link: https://lore.kernel.org/r/20201029170846.14786-1-mwilck@suse.com
Fixes: 9983bed3907c ("scsi: Add scsi_vpd_lun_id()")
Reviewed-by: Hannes Reinecke <hare@suse.de>
Signed-off-by: Martin Wilck <mwilck@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-10-29 20:08:45 +03:00
cur_id_prio = prio ;
2015-12-01 12:16:55 +03:00
cur_id_size = d [ 3 ] ;
cur_id_str = d + 4 ;
switch ( cur_id_size ) {
case 8 :
id_size = snprintf ( id , id_len ,
" naa.%8phN " ,
cur_id_str ) ;
break ;
case 16 :
id_size = snprintf ( id , id_len ,
" naa.%16phN " ,
cur_id_str ) ;
break ;
default :
break ;
}
break ;
case 0x8 :
/* SCSI name string */
scsi: core: Fix VPD LUN ID designator priorities
The current implementation of scsi_vpd_lun_id() uses the designator length
as an implicit measure of priority. This works most of the time, but not
always. For example, some Hitachi storage arrays return this in VPD 0x83:
VPD INQUIRY: Device Identification page
Designation descriptor number 1, descriptor length: 24
designator_type: T10 vendor identification, code_set: ASCII
associated with the Addressed logical unit
vendor id: HITACHI
vendor specific: 5030C3502025
Designation descriptor number 2, descriptor length: 6
designator_type: vendor specific [0x0], code_set: Binary
associated with the Target port
vendor specific: 08 03
Designation descriptor number 3, descriptor length: 20
designator_type: NAA, code_set: Binary
associated with the Addressed logical unit
NAA 6, IEEE Company_id: 0x60e8
Vendor Specific Identifier: 0x7c35000
Vendor Specific Identifier Extension: 0x30c35000002025
[0x60060e8007c350000030c35000002025]
The current code would use the first descriptor because it's longer than
the NAA descriptor. But this is wrong, the kernel is supposed to prefer NAA
descriptors over T10 vendor ID. Designator length should only be used to
compare designators of the same type.
This patch addresses the issue by separating designator priority and
length.
Link: https://lore.kernel.org/r/20201029170846.14786-1-mwilck@suse.com
Fixes: 9983bed3907c ("scsi: Add scsi_vpd_lun_id()")
Reviewed-by: Hannes Reinecke <hare@suse.de>
Signed-off-by: Martin Wilck <mwilck@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-10-29 20:08:45 +03:00
if ( cur_id_size > d [ 3 ] )
2015-12-01 12:16:55 +03:00
break ;
/* Prefer others for truncated descriptor */
scsi: core: Fix VPD LUN ID designator priorities
The current implementation of scsi_vpd_lun_id() uses the designator length
as an implicit measure of priority. This works most of the time, but not
always. For example, some Hitachi storage arrays return this in VPD 0x83:
VPD INQUIRY: Device Identification page
Designation descriptor number 1, descriptor length: 24
designator_type: T10 vendor identification, code_set: ASCII
associated with the Addressed logical unit
vendor id: HITACHI
vendor specific: 5030C3502025
Designation descriptor number 2, descriptor length: 6
designator_type: vendor specific [0x0], code_set: Binary
associated with the Target port
vendor specific: 08 03
Designation descriptor number 3, descriptor length: 20
designator_type: NAA, code_set: Binary
associated with the Addressed logical unit
NAA 6, IEEE Company_id: 0x60e8
Vendor Specific Identifier: 0x7c35000
Vendor Specific Identifier Extension: 0x30c35000002025
[0x60060e8007c350000030c35000002025]
The current code would use the first descriptor because it's longer than
the NAA descriptor. But this is wrong, the kernel is supposed to prefer NAA
descriptors over T10 vendor ID. Designator length should only be used to
compare designators of the same type.
This patch addresses the issue by separating designator priority and
length.
Link: https://lore.kernel.org/r/20201029170846.14786-1-mwilck@suse.com
Fixes: 9983bed3907c ("scsi: Add scsi_vpd_lun_id()")
Reviewed-by: Hannes Reinecke <hare@suse.de>
Signed-off-by: Martin Wilck <mwilck@suse.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
2020-10-29 20:08:45 +03:00
if ( d [ 3 ] > id_len ) {
prio = 2 ;
if ( cur_id_prio > prio )
break ;
}
cur_id_prio = prio ;
2015-12-01 12:16:55 +03:00
cur_id_size = id_size = d [ 3 ] ;
cur_id_str = d + 4 ;
if ( cur_id_size > = id_len )
cur_id_size = id_len - 1 ;
memcpy ( id , cur_id_str , cur_id_size ) ;
break ;
default :
break ;
}
}
rcu_read_unlock ( ) ;
return id_size ;
}
EXPORT_SYMBOL ( scsi_vpd_lun_id ) ;
2015-12-01 12:16:57 +03:00
/*
* scsi_vpd_tpg_id - return a target port group identifier
* @ sdev : SCSI device
*
* Returns the Target Port Group identifier from the information
* froom VPD page 0x83 of the device .
*
* Returns the identifier or error on failure .
*/
int scsi_vpd_tpg_id ( struct scsi_device * sdev , int * rel_id )
{
2017-08-29 18:50:13 +03:00
const unsigned char * d ;
const struct scsi_vpd * vpd_pg83 ;
2015-12-01 12:16:57 +03:00
int group_id = - EAGAIN , rel_port = - 1 ;
rcu_read_lock ( ) ;
vpd_pg83 = rcu_dereference ( sdev - > vpd_pg83 ) ;
if ( ! vpd_pg83 ) {
rcu_read_unlock ( ) ;
return - ENXIO ;
}
2017-08-29 18:50:13 +03:00
d = vpd_pg83 - > data + 4 ;
while ( d < vpd_pg83 - > data + vpd_pg83 - > len ) {
2015-12-01 12:16:57 +03:00
switch ( d [ 1 ] & 0xf ) {
case 0x4 :
/* Relative target port */
rel_port = get_unaligned_be16 ( & d [ 6 ] ) ;
break ;
case 0x5 :
/* Target port group */
group_id = get_unaligned_be16 ( & d [ 6 ] ) ;
break ;
default :
break ;
}
d + = d [ 3 ] + 4 ;
}
rcu_read_unlock ( ) ;
if ( group_id > = 0 & & rel_id & & rel_port ! = - 1 )
* rel_id = rel_port ;
return group_id ;
}
EXPORT_SYMBOL ( scsi_vpd_tpg_id ) ;
2021-04-27 11:30:13 +03:00
/**
* scsi_build_sense - build sense data for a command
* @ scmd : scsi command for which the sense should be formatted
* @ desc : Sense format ( non - zero = = descriptor format ,
* 0 = = fixed format )
* @ key : Sense key
* @ asc : Additional sense code
* @ ascq : Additional sense code qualifier
*
* */
void scsi_build_sense ( struct scsi_cmnd * scmd , int desc , u8 key , u8 asc , u8 ascq )
{
scsi_build_sense_buffer ( desc , scmd - > sense_buffer , key , asc , ascq ) ;
2021-04-27 11:30:15 +03:00
scmd - > result = SAM_STAT_CHECK_CONDITION ;
2021-04-27 11:30:13 +03:00
}
EXPORT_SYMBOL_GPL ( scsi_build_sense ) ;