From: Hannes Reinecke <hare@suse.de>
To: Christoph Hellwig <hch@lst.de>,
James Bottomley <James.Bottomley@HansenPartnership.com>
Cc: Jens Axboe <axboe@kernel.dk>,
Bart Van Assche <bvanassche@fusionio.com>,
Robert Elliott <Elliott@hp.com>,
linux-scsi@vger.kernel.org, linux-kernel@vger.kernel.org
Subject: Re: [PATCH 09/14] scsi: fix the {host,target,device}_blocked counter mess
Date: Wed, 09 Jul 2014 13:12:17 +0200 [thread overview]
Message-ID: <53BD2391.90800@suse.de> (raw)
In-Reply-To: <1403715121-1201-10-git-send-email-hch@lst.de>
On 06/25/2014 06:51 PM, Christoph Hellwig wrote:
> Seems like these counters are missing any sort of synchronization for
> updates, as a over 10 year old comment from me noted. Fix this by
> using atomic counters, and while we're at it also make sure they are
> in the same cacheline as the _busy counters and not needlessly stored
> to in every I/O completion.
>
> With the new model the _busy counters can temporarily go negative,
> so all the readers are updated to check for > 0 values. Longer
> term every successful I/O completion will reset the counters to zero,
> so the temporarily negative values will not cause any harm.
>
> Signed-off-by: Christoph Hellwig <hch@lst.de>
> ---
> drivers/scsi/scsi.c | 21 ++++++------
> drivers/scsi/scsi_lib.c | 82 +++++++++++++++++++++-----------------------
> drivers/scsi/scsi_sysfs.c | 10 +++++-
> include/scsi/scsi_device.h | 7 ++--
> include/scsi/scsi_host.h | 7 ++--
> 5 files changed, 64 insertions(+), 63 deletions(-)
>
> diff --git a/drivers/scsi/scsi.c b/drivers/scsi/scsi.c
> index 35a23e2..b362058 100644
> --- a/drivers/scsi/scsi.c
> +++ b/drivers/scsi/scsi.c
> @@ -729,17 +729,16 @@ void scsi_finish_command(struct scsi_cmnd *cmd)
>
> scsi_device_unbusy(sdev);
>
> - /*
> - * Clear the flags which say that the device/host is no longer
> - * capable of accepting new commands. These are set in scsi_queue.c
> - * for both the queue full condition on a device, and for a
> - * host full condition on the host.
> - *
> - * XXX(hch): What about locking?
> - */
> - shost->host_blocked = 0;
> - starget->target_blocked = 0;
> - sdev->device_blocked = 0;
> + /*
> + * Clear the flags which say that the device/target/host is no longer
> + * capable of accepting new commands.
> + */
> + if (atomic_read(&shost->host_blocked))
> + atomic_set(&shost->host_blocked, 0);
> + if (atomic_read(&starget->target_blocked))
> + atomic_set(&starget->target_blocked, 0);
> + if (atomic_read(&sdev->device_blocked))
> + atomic_set(&sdev->device_blocked, 0);
>
> /*
> * If we have valid sense information, then some kind of recovery
Hmm. I guess there is a race window between
atomic_read() and atomic_set().
Doesn't this cause issues when someone calls atomic_set() just
before the call to atomic_read?
> diff --git a/drivers/scsi/scsi_lib.c b/drivers/scsi/scsi_lib.c
> index e23fef5..a39d5ba 100644
> --- a/drivers/scsi/scsi_lib.c
> +++ b/drivers/scsi/scsi_lib.c
> @@ -99,14 +99,16 @@ scsi_set_blocked(struct scsi_cmnd *cmd, int reason)
> */
> switch (reason) {
> case SCSI_MLQUEUE_HOST_BUSY:
> - host->host_blocked = host->max_host_blocked;
> + atomic_set(&host->host_blocked, host->max_host_blocked);
> break;
> case SCSI_MLQUEUE_DEVICE_BUSY:
> case SCSI_MLQUEUE_EH_RETRY:
> - device->device_blocked = device->max_device_blocked;
> + atomic_set(&device->device_blocked,
> + device->max_device_blocked);
> break;
> case SCSI_MLQUEUE_TARGET_BUSY:
> - starget->target_blocked = starget->max_target_blocked;
> + atomic_set(&starget->target_blocked,
> + starget->max_target_blocked);
> break;
> }
> }
> @@ -351,30 +353,39 @@ static void scsi_single_lun_run(struct scsi_device *current_sdev)
> spin_unlock_irqrestore(shost->host_lock, flags);
> }
>
> -static inline int scsi_device_is_busy(struct scsi_device *sdev)
> +static inline bool scsi_device_is_busy(struct scsi_device *sdev)
> {
> if (atomic_read(&sdev->device_busy) >= sdev->queue_depth)
> - return 1;
> - if (sdev->device_blocked)
> - return 1;
> + return true;
> + if (atomic_read(&sdev->device_blocked) > 0)
> + return true;
> return 0;
> }
>
> -static inline int scsi_target_is_busy(struct scsi_target *starget)
> +static inline bool scsi_target_is_busy(struct scsi_target *starget)
> {
> - return ((starget->can_queue > 0 &&
> - atomic_read(&starget->target_busy) >= starget->can_queue) ||
> - starget->target_blocked);
> + if (starget->can_queue > 0) {
> + if (atomic_read(&starget->target_busy) >= starget->can_queue)
> + return true;
> + if (atomic_read(&starget->target_blocked) > 0)
> + return true;
> + }
> +
> + return false;
> }
>
> -static inline int scsi_host_is_busy(struct Scsi_Host *shost)
> +static inline bool scsi_host_is_busy(struct Scsi_Host *shost)
> {
> - if ((shost->can_queue > 0 &&
> - atomic_read(&shost->host_busy) >= shost->can_queue) ||
> - shost->host_blocked || shost->host_self_blocked)
> - return 1;
> + if (shost->can_queue > 0) {
> + if (atomic_read(&shost->host_busy) >= shost->can_queue)
> + return true;
> + if (atomic_read(&shost->host_blocked) > 0)
> + return true;
> + if (shost->host_self_blocked)
> + return true;
> + }
>
> - return 0;
> + return false;
> }
>
> static void scsi_starved_list_run(struct Scsi_Host *shost)
> @@ -1283,11 +1294,8 @@ static inline int scsi_dev_queue_ready(struct request_queue *q,
> unsigned int busy;
>
> busy = atomic_inc_return(&sdev->device_busy) - 1;
> - if (busy == 0 && sdev->device_blocked) {
> - /*
> - * unblock after device_blocked iterates to zero
> - */
> - if (--sdev->device_blocked != 0) {
> + if (busy == 0 && atomic_read(&sdev->device_blocked) > 0) {
> + if (atomic_dec_return(&sdev->device_blocked) > 0) {
> blk_delay_queue(q, SCSI_QUEUE_DELAY);
> goto out_dec;
> }
> @@ -1297,7 +1305,7 @@ static inline int scsi_dev_queue_ready(struct request_queue *q,
>
> if (busy >= sdev->queue_depth)
> goto out_dec;
> - if (sdev->device_blocked)
> + if (atomic_read(&sdev->device_blocked) > 0)
> goto out_dec;
>
> return 1;
> @@ -1328,16 +1336,9 @@ static inline int scsi_target_queue_ready(struct Scsi_Host *shost,
> }
>
> busy = atomic_inc_return(&starget->target_busy) - 1;
> - if (busy == 0 && starget->target_blocked) {
> - /*
> - * unblock after target_blocked iterates to zero
> - */
> - spin_lock_irq(shost->host_lock);
> - if (--starget->target_blocked != 0) {
> - spin_unlock_irq(shost->host_lock);
> + if (busy == 0 && atomic_read(&starget->target_blocked) > 0) {
> + if (atomic_dec_return(&starget->target_blocked) > 0)
> goto out_dec;
> - }
> - spin_unlock_irq(shost->host_lock);
>
> SCSI_LOG_MLQUEUE(3, starget_printk(KERN_INFO, starget,
> "unblocking target at zero depth\n"));
> @@ -1345,7 +1346,7 @@ static inline int scsi_target_queue_ready(struct Scsi_Host *shost,
>
> if (starget->can_queue > 0 && busy >= starget->can_queue)
> goto starved;
> - if (starget->target_blocked)
> + if (atomic_read(&starget->target_blocked) > 0)
> goto starved;
>
> return 1;
> @@ -1374,16 +1375,9 @@ static inline int scsi_host_queue_ready(struct request_queue *q,
> return 0;
>
> busy = atomic_inc_return(&shost->host_busy) - 1;
> - if (busy == 0 && shost->host_blocked) {
> - /*
> - * unblock after host_blocked iterates to zero
> - */
> - spin_lock_irq(shost->host_lock);
> - if (--shost->host_blocked != 0) {
> - spin_unlock_irq(shost->host_lock);
> + if (busy == 0 && atomic_read(&shost->host_blocked) > 0) {
> + if (atomic_dec_return(&shost->host_blocked) > 0)
> goto out_dec;
> - }
> - spin_unlock_irq(shost->host_lock);
>
> SCSI_LOG_MLQUEUE(3,
> shost_printk(KERN_INFO, shost,
Same with this one.
Cheers,
Hannes
--
Dr. Hannes Reinecke zSeries & Storage
hare@suse.de +49 911 74053 688
SUSE LINUX Products GmbH, Maxfeldstr. 5, 90409 Nürnberg
GF: J. Hawn, J. Guild, F. Imendörffer, HRB 16746 (AG Nürnberg)
next prev parent reply other threads:[~2014-07-09 11:12 UTC|newest]
Thread overview: 86+ messages / expand[flat|nested] mbox.gz Atom feed top
2014-06-25 16:51 scsi-mq V2 Christoph Hellwig
2014-06-25 16:51 ` [PATCH 01/14] sd: don't use rq->cmd_len before setting it up Christoph Hellwig
2014-07-09 11:12 ` Hannes Reinecke
2014-07-09 15:03 ` Christoph Hellwig
2014-06-25 16:51 ` [PATCH 02/14] scsi: split __scsi_queue_insert Christoph Hellwig
2014-07-09 11:12 ` Hannes Reinecke
2014-06-25 16:51 ` [PATCH 03/14] scsi: centralize command re-queueing in scsi_dispatch_fn Christoph Hellwig
2014-07-08 20:51 ` Elliott, Robert (Server Storage)
2014-07-09 6:40 ` Christoph Hellwig
2014-07-09 11:13 ` Hannes Reinecke
2014-06-25 16:51 ` [PATCH 04/14] scsi: set ->scsi_done before calling scsi_dispatch_cmd Christoph Hellwig
2014-07-09 11:14 ` Hannes Reinecke
2014-06-25 16:51 ` [PATCH 05/14] scsi: push host_lock down into scsi_{host,target}_queue_ready Christoph Hellwig
2014-07-09 11:14 ` Hannes Reinecke
2014-06-25 16:51 ` [PATCH 06/14] scsi: convert target_busy to an atomic_t Christoph Hellwig
2014-07-09 11:15 ` Hannes Reinecke
2014-06-25 16:51 ` [PATCH 07/14] scsi: convert host_busy to atomic_t Christoph Hellwig
2014-07-09 11:15 ` Hannes Reinecke
2014-06-25 16:51 ` [PATCH 08/14] scsi: convert device_busy " Christoph Hellwig
2014-07-09 11:16 ` Hannes Reinecke
2014-07-09 16:49 ` James Bottomley
2014-07-10 6:01 ` Christoph Hellwig
2014-06-25 16:51 ` [PATCH 09/14] scsi: fix the {host,target,device}_blocked counter mess Christoph Hellwig
2014-07-09 11:12 ` Hannes Reinecke [this message]
2014-07-10 6:06 ` Christoph Hellwig
2014-06-25 16:51 ` [PATCH 10/14] scsi: only maintain target_blocked if the driver has a target queue limit Christoph Hellwig
2014-07-09 11:19 ` Hannes Reinecke
2014-07-09 15:05 ` Christoph Hellwig
2014-06-25 16:51 ` [PATCH 11/14] scsi: unwind blk_end_request_all and blk_end_request_err calls Christoph Hellwig
2014-07-09 11:20 ` Hannes Reinecke
2014-06-25 16:51 ` [PATCH 12/14] scatterlist: allow chaining to preallocated chunks Christoph Hellwig
2014-07-09 11:21 ` Hannes Reinecke
2014-06-25 16:52 ` [PATCH 13/14] scsi: add support for a blk-mq based I/O path Christoph Hellwig
2014-07-09 11:25 ` Hannes Reinecke
2014-07-16 11:13 ` Mike Christie
2014-07-16 11:16 ` Christoph Hellwig
2014-06-25 16:52 ` [PATCH 14/14] fnic: reject device resets without assigned tags for the blk-mq case Christoph Hellwig
2014-07-09 11:27 ` Hannes Reinecke
2014-06-26 4:50 ` scsi-mq V2 Jens Axboe
2014-06-26 22:07 ` Elliott, Robert (Server Storage)
2014-06-27 14:42 ` Bart Van Assche
2014-06-30 15:20 ` Jens Axboe
2014-06-30 15:25 ` Christoph Hellwig
2014-06-30 15:54 ` Martin K. Petersen
2014-07-08 14:48 ` Christoph Hellwig
2014-07-09 16:39 ` Douglas Gilbert
2014-07-09 19:38 ` Jens Axboe
2014-07-10 0:53 ` Elliott, Robert (Server Storage)
2014-07-10 6:20 ` Christoph Hellwig
2014-07-10 13:36 ` Benjamin LaHaise
2014-07-10 13:39 ` Jens Axboe
2014-07-10 13:44 ` Benjamin LaHaise
2014-07-10 13:48 ` Jens Axboe
2014-07-10 13:50 ` Benjamin LaHaise
2014-07-10 13:52 ` Jens Axboe
2014-07-10 13:50 ` Christoph Hellwig
2014-07-10 13:52 ` Jens Axboe
2014-07-10 14:36 ` Elliott, Robert (Server Storage)
2014-07-10 14:45 ` Benjamin LaHaise
2014-07-10 15:11 ` Jeff Moyer
2014-07-10 19:59 ` Jens Axboe
2014-07-10 20:05 ` Jeff Moyer
2014-07-10 20:06 ` Jens Axboe
2014-07-10 15:51 ` Elliott, Robert (Server Storage)
2014-07-10 16:04 ` Christoph Hellwig
2014-07-10 16:14 ` Christoph Hellwig
2014-07-10 18:49 ` Elliott, Robert (Server Storage)
2014-07-10 19:14 ` Jeff Moyer
2014-07-10 19:36 ` Jeff Moyer
2014-07-10 21:10 ` Elliott, Robert (Server Storage)
2014-07-11 6:02 ` Elliott, Robert (Server Storage)
2014-07-11 6:14 ` Christoph Hellwig
2014-07-11 14:33 ` Elliott, Robert (Server Storage)
2014-07-11 14:55 ` Benjamin LaHaise
2014-07-12 21:50 ` Elliott, Robert (Server Storage)
2014-07-12 23:20 ` Elliott, Robert (Server Storage)
2014-07-13 17:15 ` Elliott, Robert (Server Storage)
2014-07-14 17:15 ` Benjamin LaHaise
2014-07-14 9:13 ` Sagi Grimberg
2014-08-21 12:32 ` Performance degradation in IO writes vs. reads (was scsi-mq V2) Sagi Grimberg
2014-08-21 13:03 ` Christoph Hellwig
2014-08-21 14:02 ` Sagi Grimberg
2014-08-24 16:41 ` Sagi Grimberg
-- strict thread matches above, loose matches on Subject: below --
2014-07-18 10:12 scsi-mq V4 Christoph Hellwig
2014-07-18 10:13 ` [PATCH 09/14] scsi: fix the {host,target,device}_blocked counter mess Christoph Hellwig
2014-07-25 19:08 ` Martin K. Petersen
2014-06-12 13:48 scsi-mq Christoph Hellwig
2014-06-12 13:49 ` [PATCH 09/14] scsi: fix the {host,target,device}_blocked counter mess Christoph Hellwig
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=53BD2391.90800@suse.de \
--to=hare@suse.de \
--cc=Elliott@hp.com \
--cc=James.Bottomley@HansenPartnership.com \
--cc=axboe@kernel.dk \
--cc=bvanassche@fusionio.com \
--cc=hch@lst.de \
--cc=linux-kernel@vger.kernel.org \
--cc=linux-scsi@vger.kernel.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).