All of lore.kernel.org
 help / color / mirror / Atom feed
From: Hannes Reinecke <hare@suse.de>
To: Christoph Hellwig <hch@lst.de>
Cc: "Martin K. Petersen" <martin.petersen@oracle.com>,
	James Bottomley <jbottomley@odin.com>,
	Ewan Milne <emilne@redhat.com>,
	Bart van Assche <bart.vanassche@sandisk.com>,
	linux-scsi@vger.kernel.org
Subject: Re: [PATCH 13/20] scsi_dh_alua: Recheck state on unit attention
Date: Thu, 31 Dec 2015 15:02:16 +0100	[thread overview]
Message-ID: <56853568.1040606@suse.de> (raw)
In-Reply-To: <20151230132258.GC15270@lst.de>

On 12/30/2015 02:22 PM, Christoph Hellwig wrote:
> On Tue, Dec 08, 2015 at 08:37:33AM +0100, Hannes Reinecke wrote:
>> When we receive a unit attention code of 'ALUA state changed'
>> we should recheck the state, as it might be due to an implicit
> >> ALUA state transition. This allows us to return NEEDS_RETRY
> >> instead of ADD_TO_MLQUEUE, so that the retries can be terminated
> >> after a certain time.
>> At the same time a workqueue item might already be queued, which
>> should be started immediately to avoid any delays.
>>
>> Signed-off-by: Hannes Reinecke <hare@suse.de>
>> ---
>>   drivers/scsi/device_handler/scsi_dh_alua.c | 58 ++++++++++++++++++++++++------
>>   1 file changed, 47 insertions(+), 11 deletions(-)
>>
>> diff --git a/drivers/scsi/device_handler/scsi_dh_alua.c b/drivers/scsi/device_handler/scsi_dh_alua.c
>> index 525449f..04a3a543 100644
>> --- a/drivers/scsi/device_handler/scsi_dh_alua.c
>> +++ b/drivers/scsi/device_handler/scsi_dh_alua.c
>> @@ -121,7 +121,8 @@ struct alua_queue_data {
>>   static void alua_rtpg_work(struct work_struct *work);
>>   static void alua_rtpg_queue(struct alua_port_group *pg,
>>   			    struct scsi_device *sdev,
>> -			    struct alua_queue_data *qdata);
>> +			    struct alua_queue_data *qdata, bool force);
>> +static void alua_check(struct scsi_device *sdev, bool force);
>>
>>   static void release_port_group(struct kref *kref)
>>   {
>> @@ -386,7 +387,7 @@ static int alua_check_vpd(struct scsi_device *sdev, struct alua_dh_data *h,
>>   		rcu_assign_pointer(h->pg, pg);
>>   		pg_found = true;
>>   	}
>> -	alua_rtpg_queue(h->pg, sdev, NULL);
>> +	alua_rtpg_queue(h->pg, sdev, NULL, true);
>>   	spin_unlock(&h->pg_lock);
>>
>>   	if (pg_found)
>> @@ -427,18 +428,24 @@ static int alua_check_sense(struct scsi_device *sdev,
>>   {
>>   	switch (sense_hdr->sense_key) {
>>   	case NOT_READY:
>> -		if (sense_hdr->asc == 0x04 && sense_hdr->ascq == 0x0a)
>> +		if (sense_hdr->asc == 0x04 && sense_hdr->ascq == 0x0a) {
>>   			/*
>>   			 * LUN Not Accessible - ALUA state transition
>>   			 */
>> -			return ADD_TO_MLQUEUE;
>> +			alua_check(sdev, false);
>> +			return NEEDS_RETRY;
>> +		}
>>   		break;
>>   	case UNIT_ATTENTION:
>> -		if (sense_hdr->asc == 0x29 && sense_hdr->ascq == 0x00)
>> +		if (sense_hdr->asc == 0x29 && sense_hdr->ascq == 0x00) {
>>   			/*
>> -			 * Power On, Reset, or Bus Device Reset, just retry.
>> +			 * Power On, Reset, or Bus Device Reset.
>> +			 * Might have obscured a state transition,
>> +			 * so schedule a recheck.
>>   			 */
>> +			alua_check(sdev, true);
>>   			return ADD_TO_MLQUEUE;
>> +		}
>>   		if (sense_hdr->asc == 0x29 && sense_hdr->ascq == 0x04)
>>   			/*
>>   			 * Device internal reset
>> @@ -449,16 +456,20 @@ static int alua_check_sense(struct scsi_device *sdev,
>>   			 * Mode Parameters Changed
>>   			 */
>>   			return ADD_TO_MLQUEUE;
>> -		if (sense_hdr->asc == 0x2a && sense_hdr->ascq == 0x06)
>> +		if (sense_hdr->asc == 0x2a && sense_hdr->ascq == 0x06) {
>>   			/*
>>   			 * ALUA state changed
>>   			 */
>> +			alua_check(sdev, true);
>>   			return ADD_TO_MLQUEUE;
>> -		if (sense_hdr->asc == 0x2a && sense_hdr->ascq == 0x07)
>> +		}
>> +		if (sense_hdr->asc == 0x2a && sense_hdr->ascq == 0x07) {
>>   			/*
>>   			 * Implicit ALUA state transition failed
>>   			 */
>> +			alua_check(sdev, true);
>>   			return ADD_TO_MLQUEUE;
>> +		}
>>   		if (sense_hdr->asc == 0x3f && sense_hdr->ascq == 0x03)
>>   			/*
>>   			 * Inquiry data has changed
>> @@ -777,7 +788,7 @@ static void alua_rtpg_work(struct work_struct *work)
>>
>>   static void alua_rtpg_queue(struct alua_port_group *pg,
>>   			    struct scsi_device *sdev,
>> -			    struct alua_queue_data *qdata)
>> +			    struct alua_queue_data *qdata, bool force)
>>   {
>>   	int start_queue = 0;
>>   	unsigned long flags;
>> @@ -797,7 +808,9 @@ static void alua_rtpg_queue(struct alua_port_group *pg,
>>   		pg->rtpg_sdev = sdev;
>>   		scsi_device_get(sdev);
>>   		start_queue = 1;
>> -	}
>> +	} else if (!(pg->flags & ALUA_PG_RUN_RTPG) && force)
>> +		start_queue = 1;
>> +
>>   	spin_unlock_irqrestore(&pg->lock, flags);
>>
>>   	if (start_queue &&
>> @@ -912,7 +925,7 @@ static int alua_activate(struct scsi_device *sdev,
>>   	kref_get(&pg->kref);
>>   	rcu_read_unlock();
>>
>> -	alua_rtpg_queue(pg, sdev, qdata);
>> +	alua_rtpg_queue(pg, sdev, qdata, true);
>>   	kref_put(&pg->kref, release_port_group);
>>   out:
>>   	if (fn)
>> @@ -921,6 +934,29 @@ out:
>>   }
>>
>>   /*
>> + * alua_check - check path status
>> + * @sdev: device on the path to be checked
>> + *
>> + * Check the device status
>> + */
>> +static void alua_check(struct scsi_device *sdev, bool force)
>> +{
>> +	struct alua_dh_data *h = sdev->handler_data;
>> +	struct alua_port_group *pg;
>> +
>> +	rcu_read_lock();
>> +	pg = rcu_dereference(h->pg);
>> +	if (!pg) {
>> +		rcu_read_unlock();
>> +		return;
>> +	}
>> +	kref_get(&pg->kref);
>
> What protects us from pg->kref being released?  I think the whole
> refcounting scheme needs an audit to see where kref_get is called
> without synchronization and use kref_get_unless_zero where needed.
>
Hehe. This really is a bit of an awkward point. The overall idea here is
that rcu_dereference() will give us a port_group structure.
But seeing that this pointer is not necessarily synchronized, we need to
use kref_get_unless_zero() here, true.

Cheers,

Hannes
-- 
Dr. Hannes Reinecke		      zSeries & Storage
hare@suse.de			      +49 911 74053 688
SUSE LINUX Products GmbH, Maxfeldstr. 5, 90409 Nürnberg
GF: J. Hawn, J. Guild, F. Imendörffer, HRB 16746 (AG Nürnberg)
--
To unsubscribe from this list: send the line "unsubscribe linux-scsi" in
the body of a message to majordomo@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

  reply	other threads:[~2015-12-31 14:02 UTC|newest]

Thread overview: 49+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2015-12-08  7:37 [PATCH 00/20] ALUA device handler update, part II Hannes Reinecke
2015-12-08  7:37 ` [PATCH 01/20] scsi_dh_alua: Pass buffer as function argument Hannes Reinecke
2015-12-08  7:37 ` [PATCH 02/20] scsi_dh_alua: separate out alua_stpg() Hannes Reinecke
2015-12-30 11:06   ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 03/20] scsi_dh_alua: Make stpg synchronous Hannes Reinecke
2015-12-30 11:10   ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 04/20] scsi_dh_alua: call alua_rtpg() if stpg fails Hannes Reinecke
2015-12-30 11:10   ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 05/20] scsi_dh_alua: switch to scsi_execute_req_flags() Hannes Reinecke
2015-12-08  7:37 ` [PATCH 06/20] scsi_dh_alua: Use separate alua_port_group structure Hannes Reinecke
2015-12-30 11:17   ` Christoph Hellwig
2015-12-31 12:47     ` Hannes Reinecke
2015-12-08  7:37 ` [PATCH 07/20] scsi_dh_alua: allocate RTPG buffer separately Hannes Reinecke
2015-12-08  7:37 ` [PATCH 08/20] scsi_dh_alua: use unique device id Hannes Reinecke
2015-12-30 11:20   ` Christoph Hellwig
2015-12-31 12:53     ` Hannes Reinecke
2015-12-08  7:37 ` [PATCH 09/20] scsi_dh_alua: simplify alua_initialize() Hannes Reinecke
2015-12-30 11:21   ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 10/20] revert commit a8e5a2d593cb ("[SCSI] scsi_dh_alua: ALUA handler attach should succeed while TPG is transitioning") Hannes Reinecke
2015-12-30 11:22   ` Christoph Hellwig
2015-12-31 12:54     ` Hannes Reinecke
2015-12-08  7:37 ` [PATCH 11/20] scsi_dh_alua: Use workqueue for RTPG Hannes Reinecke
2015-12-30 13:19   ` Christoph Hellwig
2015-12-31 13:01     ` Hannes Reinecke
2016-01-03 10:53       ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 12/20] scsi_dh_alua: Allow workqueue to run synchronously Hannes Reinecke
2015-12-30 13:20   ` Christoph Hellwig
2015-12-31 13:54     ` Hannes Reinecke
2016-01-03 10:54       ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 13/20] scsi_dh_alua: Recheck state on unit attention Hannes Reinecke
2015-12-30 13:22   ` Christoph Hellwig
2015-12-31 14:02     ` Hannes Reinecke [this message]
2015-12-08  7:37 ` [PATCH 14/20] scsi_dh_alua: update all port states Hannes Reinecke
2015-12-30 13:23   ` Christoph Hellwig
2015-12-31 14:09     ` Hannes Reinecke
2015-12-08  7:37 ` [PATCH 15/20] scsi_dh_alua: Send TEST UNIT READY to poll for transitioning Hannes Reinecke
2015-12-30 13:24   ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 16/20] scsi_dh: add 'rescan' callback Hannes Reinecke
2015-12-30 13:24   ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 17/20] scsi: Add 'access_state' attribute Hannes Reinecke
2015-12-30 13:24   ` Christoph Hellwig
2015-12-30 13:26   ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 18/20] scsi_dh_alua: use common definitions for ALUA state Hannes Reinecke
2015-12-30 13:28   ` Christoph Hellwig
2015-12-08  7:37 ` [PATCH 19/20] scsi_dh_alua: update 'access_state' field Hannes Reinecke
2015-12-30 13:34   ` Christoph Hellwig
2015-12-31 14:15     ` Hannes Reinecke
2015-12-08  7:37 ` [PATCH 20/20] scsi_dh_alua: Update version to 2.0 Hannes Reinecke
2015-12-08 15:06 ` [PATCH 00/20] ALUA device handler update, part II Hannes Reinecke

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=56853568.1040606@suse.de \
    --to=hare@suse.de \
    --cc=bart.vanassche@sandisk.com \
    --cc=emilne@redhat.com \
    --cc=hch@lst.de \
    --cc=jbottomley@odin.com \
    --cc=linux-scsi@vger.kernel.org \
    --cc=martin.petersen@oracle.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.