[PATCH] NVMe: Add support to receive NVMe asynchronous events

Linux-NVME Archive on lore.kernel.org
 help / color / mirror / Atom feed

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
@ 2014-05-26 20:04 Winson Yung (wyung)
  2014-05-26 21:42 ` Keith Busch
  2014-05-26 23:51 ` Matthew Wilcox
  0 siblings, 2 replies; 11+ messages in thread
From: Winson Yung (wyung) @ 2014-05-26 20:04 UTC (permalink / raw)


As a NVMe mandatory admin command, this driver should be setup so
that it can receive drive critical asynchronous notification for
issue such as device reliability, temperature above threshold, or
available spare space fallen below threshould. This patch enables
very basic mechanism to log the asynchronous events in kernel log.

Signed-off-by: Winson Yung <wyung at micron.com>
---
 drivers/block/nvme-core.c |   57 +++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 57 insertions(+)

diff --git a/drivers/block/nvme-core.c b/drivers/block/nvme-core.c
index cd8a8bc7..4cd9f8e 100644
--- a/drivers/block/nvme-core.c
+++ b/drivers/block/nvme-core.c
@@ -198,6 +198,7 @@ static int alloc_cmdid_killable(struct nvme_queue *nvmeq, void *ctx,
 #define CMD_CTX_COMPLETED	(0x310 + CMD_CTX_BASE)
 #define CMD_CTX_INVALID		(0x314 + CMD_CTX_BASE)
 #define CMD_CTX_ABORT		(0x318 + CMD_CTX_BASE)
+#define CMD_CTX_ASYNC_EVENT	(0x319 + CMD_CTX_BASE)
 
 static void special_completion(struct nvme_queue *nvmeq, void *ctx,
 						struct nvme_completion *cqe)
@@ -227,7 +228,27 @@ static void special_completion(struct nvme_queue *nvmeq, void *ctx,
 static void async_completion(struct nvme_queue *nvmeq, void *ctx,
 						struct nvme_completion *cqe)
 {
+	int cmdid;
+	struct nvme_queue *adminq;
+	struct nvme_dev *dev = nvmeq->dev;
 	struct async_cmd_info *cmdinfo = ctx;
+
+	if (ctx == CMD_CTX_ASYNC_EVENT) {
+		dev_warn(nvmeq->q_dmadev, "An async event is detected (DW0:%X)\n",
+								cqe->result);
+
+		adminq = rcu_dereference(dev->queues[0]);
+
+		/* Allocate a cmdid entry for next async event */
+		cmdid = alloc_cmdid(adminq, CMD_CTX_ASYNC_EVENT,
+						async_completion, 0);
+		if (cmdid < 0)
+			dev_warn(nvmeq->q_dmadev,
+				"Failure creating new entry for next async event\n");
+
+		return; /* Report asynchronous critical event, and exit */
+	}
+
 	cmdinfo->result = le32_to_cpup(&cqe->result);
 	cmdinfo->status = le16_to_cpup(&cqe->status) >> 1;
 	queue_kthread_work(cmdinfo->worker, &cmdinfo->work);
@@ -2381,6 +2402,37 @@ static int nvme_delete_cq(struct nvme_queue *nvmeq)
 						nvme_del_cq_work_handler);
 }
 
+static int nvme_enable_async_events(struct nvme_dev *dev)
+{
+	int status, cmdid;
+	u32 result, async_events;
+	struct nvme_queue *adminq;
+
+	async_events = NVME_SMART_CRIT_SPARE |
+			NVME_SMART_CRIT_TEMPERATURE |
+			NVME_SMART_CRIT_RELIABILITY |
+			NVME_SMART_CRIT_MEDIA |
+			NVME_SMART_CRIT_VOLATILE_MEMORY;
+
+	status = nvme_set_features(dev, NVME_FEAT_ASYNC_EVENT,
+					async_events, 0, &result);
+
+	if (status < 0)
+		return status;
+
+	if (status > 0) {
+		dev_err(&dev->pci_dev->dev, "Could not enable async event (%d)\n",
+									status);
+		return -EBUSY;
+	}
+
+	adminq = rcu_dereference(dev->queues[0]);
+
+	/* Allocate a cmdid entry in preparation of next incoming async event */
+	cmdid = alloc_cmdid(adminq, CMD_CTX_ASYNC_EVENT, async_completion, 0);
+	return cmdid;
+}
+
 static void nvme_del_sq_work_handler(struct kthread_work *work)
 {
 	struct nvme_queue *nvmeq = container_of(work, struct nvme_queue,
@@ -2638,6 +2690,11 @@ static int nvme_dev_start(struct nvme_dev *dev)
 		goto disable;
 	}
 
+	/* Enable receive asynchronous event */
+	result = nvme_enable_async_events(dev);
+	if (result < 0 && result != -EBUSY)
+		goto disable;
+
 	result = nvme_setup_io_queues(dev);
 	if (result && result != -EBUSY)
 		goto disable;
-- 
1.7.9.5

^ permalink raw reply related	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-26 20:04 [PATCH] NVMe: Add support to receive NVMe asynchronous events Winson Yung (wyung)
@ 2014-05-26 21:42 ` Keith Busch
  2014-05-27  5:02   ` Winson Yung (wyung)
  2014-05-26 23:51 ` Matthew Wilcox
  1 sibling, 1 reply; 11+ messages in thread
From: Keith Busch @ 2014-05-26 21:42 UTC (permalink / raw)


On Mon, 26 May 2014, Winson Yung (wyung) wrote:
> As a NVMe mandatory admin command, this driver should be setup so
> that it can receive drive critical asynchronous notification for
> issue such as device reliability, temperature above threshold, or
> available spare space fallen below threshould. This patch enables
> very basic mechanism to log the asynchronous events in kernel log.
>
> Signed-off-by: Winson Yung <wyung at micron.com>
> ---
> drivers/block/nvme-core.c |   57 +++++++++++++++++++++++++++++++++++++++++++++
> 1 file changed, 57 insertions(+)
>
> diff --git a/drivers/block/nvme-core.c b/drivers/block/nvme-core.c
> index cd8a8bc7..4cd9f8e 100644
> --- a/drivers/block/nvme-core.c
> +++ b/drivers/block/nvme-core.c
> @@ -198,6 +198,7 @@ static int alloc_cmdid_killable(struct nvme_queue *nvmeq, void *ctx,
> #define CMD_CTX_COMPLETED	(0x310 + CMD_CTX_BASE)
> #define CMD_CTX_INVALID		(0x314 + CMD_CTX_BASE)
> #define CMD_CTX_ABORT		(0x318 + CMD_CTX_BASE)
> +#define CMD_CTX_ASYNC_EVENT	(0x319 + CMD_CTX_BASE)

Context needs to be dword aligned, so the next new context would be 0x31c.

> static void special_completion(struct nvme_queue *nvmeq, void *ctx,
> 						struct nvme_completion *cqe)
> @@ -227,7 +228,27 @@ static void special_completion(struct nvme_queue *nvmeq, void *ctx,
> static void async_completion(struct nvme_queue *nvmeq, void *ctx,
> 						struct nvme_completion *cqe)
> {
> +	int cmdid;
> +	struct nvme_queue *adminq;
> +	struct nvme_dev *dev = nvmeq->dev;
> 	struct async_cmd_info *cmdinfo = ctx;
> +
> +	if (ctx == CMD_CTX_ASYNC_EVENT) {
> +		dev_warn(nvmeq->q_dmadev, "An async event is detected (DW0:%X)\n",
> +								cqe->result);
> +
> +		adminq = rcu_dereference(dev->queues[0]);
> +
> +		/* Allocate a cmdid entry for next async event */
> +		cmdid = alloc_cmdid(adminq, CMD_CTX_ASYNC_EVENT,
> +						async_completion, 0);

You've allocated this new cmdid with no timeout, and then you do nothing
with the command id. It's just going to get timed out.

> +		if (cmdid < 0)
> +			dev_warn(nvmeq->q_dmadev,
> +				"Failure creating new entry for next async event\n");
> +
> +		return; /* Report asynchronous critical event, and exit */
> +	}
> +
> 	cmdinfo->result = le32_to_cpup(&cqe->result);
> 	cmdinfo->status = le16_to_cpup(&cqe->status) >> 1;
> 	queue_kthread_work(cmdinfo->worker, &cmdinfo->work);
> @@ -2381,6 +2402,37 @@ static int nvme_delete_cq(struct nvme_queue *nvmeq)
> 						nvme_del_cq_work_handler);
> }
>
> +static int nvme_enable_async_events(struct nvme_dev *dev)
> +{
> +	int status, cmdid;
> +	u32 result, async_events;
> +	struct nvme_queue *adminq;
> +
> +	async_events = NVME_SMART_CRIT_SPARE |
> +			NVME_SMART_CRIT_TEMPERATURE |
> +			NVME_SMART_CRIT_RELIABILITY |
> +			NVME_SMART_CRIT_MEDIA |
> +			NVME_SMART_CRIT_VOLATILE_MEMORY;
> +
> +	status = nvme_set_features(dev, NVME_FEAT_ASYNC_EVENT,
> +					async_events, 0, &result);

I think we'd rather let the user pick what events they want to see using
the passthrough IOCTL rather than have the driver decide these things.

> +
> +	if (status < 0)
> +		return status;
> +
> +	if (status > 0) {
> +		dev_err(&dev->pci_dev->dev, "Could not enable async event (%d)\n",
> +									status);
> +		return -EBUSY;
> +	}
> +
> +	adminq = rcu_dereference(dev->queues[0]);
> +
> +	/* Allocate a cmdid entry in preparation of next incoming async event */
> +	cmdid = alloc_cmdid(adminq, CMD_CTX_ASYNC_EVENT, async_completion, 0);

Same thing as in the completion, you're allocating a cmdid, but no
command is associated with it.

I don't think you want to use the "async_completion" callback either
(is it confusing to name that callback that way? :)) unless you have
some deferred work that needs to be done upon the completion that can't
be done in interrupt context.

> +	return cmdid;
> +}
> +
> static void nvme_del_sq_work_handler(struct kthread_work *work)
> {
> 	struct nvme_queue *nvmeq = container_of(work, struct nvme_queue,
> @@ -2638,6 +2690,11 @@ static int nvme_dev_start(struct nvme_dev *dev)
> 		goto disable;
> 	}
>
> +	/* Enable receive asynchronous event */
> +	result = nvme_enable_async_events(dev);
> +	if (result < 0 && result != -EBUSY)
> +		goto disable;
> +
> 	result = nvme_setup_io_queues(dev);
> 	if (result && result != -EBUSY)
> 		goto disable;

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-26 20:04 [PATCH] NVMe: Add support to receive NVMe asynchronous events Winson Yung (wyung)
  2014-05-26 21:42 ` Keith Busch
@ 2014-05-26 23:51 ` Matthew Wilcox
  2014-05-27  0:56   ` Keith Busch
  2014-05-27  5:15   ` Winson Yung (wyung)
  1 sibling, 2 replies; 11+ messages in thread
From: Matthew Wilcox @ 2014-05-26 23:51 UTC (permalink / raw)


On Mon, May 26, 2014@01:04:55PM -0700, Winson Yung (wyung) wrote:
> As a NVMe mandatory admin command, this driver should be setup so
> that it can receive drive critical asynchronous notification for
> issue such as device reliability, temperature above threshold, or
> available spare space fallen below threshould. This patch enables
> very basic mechanism to log the asynchronous events in kernel log.

Umm ... did you test this patch?

> Signed-off-by: Winson Yung <wyung at micron.com>
> ---
>  drivers/block/nvme-core.c |   57 +++++++++++++++++++++++++++++++++++++++++++++
>  1 file changed, 57 insertions(+)
> 
> diff --git a/drivers/block/nvme-core.c b/drivers/block/nvme-core.c
> index cd8a8bc7..4cd9f8e 100644
> --- a/drivers/block/nvme-core.c
> +++ b/drivers/block/nvme-core.c
> @@ -198,6 +198,7 @@ static int alloc_cmdid_killable(struct nvme_queue *nvmeq, void *ctx,
>  #define CMD_CTX_COMPLETED	(0x310 + CMD_CTX_BASE)
>  #define CMD_CTX_INVALID		(0x314 + CMD_CTX_BASE)
>  #define CMD_CTX_ABORT		(0x318 + CMD_CTX_BASE)
> +#define CMD_CTX_ASYNC_EVENT	(0x319 + CMD_CTX_BASE)

Please only use multiples of four; that is, 0x31c, not 0x319.  Also, these
are for use by 'special_completion', not 'async_completion'.

> +static int nvme_enable_async_events(struct nvme_dev *dev)
> +{
> +	int status, cmdid;
> +	u32 result, async_events;
> +	struct nvme_queue *adminq;
> +
> +	async_events = NVME_SMART_CRIT_SPARE |
> +			NVME_SMART_CRIT_TEMPERATURE |
> +			NVME_SMART_CRIT_RELIABILITY |
> +			NVME_SMART_CRIT_MEDIA |
> +			NVME_SMART_CRIT_VOLATILE_MEMORY;
> +
> +	status = nvme_set_features(dev, NVME_FEAT_ASYNC_EVENT,
> +					async_events, 0, &result);
> +
> +	if (status < 0)
> +		return status;
> +
> +	if (status > 0) {
> +		dev_err(&dev->pci_dev->dev, "Could not enable async event (%d)\n",
> +									status);
> +		return -EBUSY;
> +	}
> +
> +	adminq = rcu_dereference(dev->queues[0]);
> +
> +	/* Allocate a cmdid entry in preparation of next incoming async event */
> +	cmdid = alloc_cmdid(adminq, CMD_CTX_ASYNC_EVENT, async_completion, 0);
> +	return cmdid;
> +}

How is this supposed to work?  You've allocated a command ID, but you
haven't submitted an asynchronous event request command.  So how does
the controller know to use this command ID to report asynchronous events?

You should probably take a look at Keith's work last year to allow userspace
to send async event requests:

http://lists.infradead.org/pipermail/linux-nvme/2013-August/000350.html

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-26 23:51 ` Matthew Wilcox
@ 2014-05-27  0:56   ` Keith Busch
  2014-05-27  5:35     ` Winson Yung (wyung)
  2014-05-28 20:35     ` Winson Yung (wyung)
  2014-05-27  5:15   ` Winson Yung (wyung)
  1 sibling, 2 replies; 11+ messages in thread
From: Keith Busch @ 2014-05-27  0:56 UTC (permalink / raw)

On Mon, 26 May 2014, Matthew Wilcox wrote:
> You should probably take a look at Keith's work last year to allow userspace
> to send async event requests:
>
> http://lists.infradead.org/pipermail/linux-nvme/2013-August/000350.html

Yeah, that proposal just lets userspace consume the results of an async
request from a FIFO read through the character device. The driver still
has to do the sending since there's no mechanism for requests from user
space with infinite timeout.

I've no idea if the proposed method for consuming results of this kind
of information was typical. I assumed it wasn't since it didn't get much
traction. :)

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-26 21:42 ` Keith Busch
@ 2014-05-27  5:02   ` Winson Yung (wyung)
  0 siblings, 0 replies; 11+ messages in thread
From: Winson Yung (wyung) @ 2014-05-27  5:02 UTC (permalink / raw)


Thanks Keith for the feedback. I wasn't sure how to use the current code 
to receive async event. I see the code create a cmdid in order to send 
an admin cmd. The operation is either synchronous or asynchronous, but 
it is always expecting the cmd completion response in the end within a 
predetermined period.

For receiving async events, I thought to just create a completion queue 
entry after 'set feature' enabling the async event, I was assuming 
anytime when there is an async event, nvme_process_cq() will pick up the 
completion queue entry I created to store the event detail, and there 
was no timeout involved regardless what I passed in for 'timeout' when 
calling alloc_cmdid.

See my additional comments inline below

On 5/26/2014 2:42 PM, Keith Busch wrote:
> On Mon, 26 May 2014, Winson Yung (wyung) wrote:
>> As a NVMe mandatory admin command, this driver should be setup so
>> that it can receive drive critical asynchronous notification for
>> issue such as device reliability, temperature above threshold, or
>> available spare space fallen below threshould. This patch enables
>> very basic mechanism to log the asynchronous events in kernel log.
>>
>> Signed-off-by: Winson Yung <wyung at micron.com>
>> ---
>> drivers/block/nvme-core.c |   57 +++++++++++++++++++++++++++++++++++++++++++++
>> 1 file changed, 57 insertions(+)
>>
>> diff --git a/drivers/block/nvme-core.c b/drivers/block/nvme-core.c
>> index cd8a8bc7..4cd9f8e 100644
>> --- a/drivers/block/nvme-core.c
>> +++ b/drivers/block/nvme-core.c
>> @@ -198,6 +198,7 @@ static int alloc_cmdid_killable(struct nvme_queue *nvmeq, void *ctx,
>> #define CMD_CTX_COMPLETED	(0x310 + CMD_CTX_BASE)
>> #define CMD_CTX_INVALID		(0x314 + CMD_CTX_BASE)
>> #define CMD_CTX_ABORT		(0x318 + CMD_CTX_BASE)
>> +#define CMD_CTX_ASYNC_EVENT	(0x319 + CMD_CTX_BASE)
>
> Context needs to be dword aligned, so the next new context would be 0x31c.
>
thanks, I will fix the dword alignment definition problem

>> static void special_completion(struct nvme_queue *nvmeq, void *ctx,
>> 						struct nvme_completion *cqe)
>> @@ -227,7 +228,27 @@ static void special_completion(struct nvme_queue *nvmeq, void *ctx,
>> static void async_completion(struct nvme_queue *nvmeq, void *ctx,
>> 						struct nvme_completion *cqe)
>> {
>> +	int cmdid;
>> +	struct nvme_queue *adminq;
>> +	struct nvme_dev *dev = nvmeq->dev;
>> 	struct async_cmd_info *cmdinfo = ctx;
>> +
>> +	if (ctx == CMD_CTX_ASYNC_EVENT) {
>> +		dev_warn(nvmeq->q_dmadev, "An async event is detected (DW0:%X)\n",
>> +								cqe->result);
>> +
>> +		adminq = rcu_dereference(dev->queues[0]);
>> +
>> +		/* Allocate a cmdid entry for next async event */
>> +		cmdid = alloc_cmdid(adminq, CMD_CTX_ASYNC_EVENT,
>> +						async_completion, 0);
>
> You've allocated this new cmdid with no timeout, and then you do nothing
> with the command id. It's just going to get timed out.
>
The reason I did this way is because I assume I need to allocate an 
empty completion queue entry in preparation to receive an incoming async 
event in the future. It doesn't need to submit anything with this cmdid. 
That's why it didn't do anything with it, and there is no timeout 
needed. Maybe my understanding was wrong.

>> +		if (cmdid < 0)
>> +			dev_warn(nvmeq->q_dmadev,
>> +				"Failure creating new entry for next async event\n");
>> +
>> +		return; /* Report asynchronous critical event, and exit */
>> +	}
>> +
>> 	cmdinfo->result = le32_to_cpup(&cqe->result);
>> 	cmdinfo->status = le16_to_cpup(&cqe->status) >> 1;
>> 	queue_kthread_work(cmdinfo->worker, &cmdinfo->work);
>> @@ -2381,6 +2402,37 @@ static int nvme_delete_cq(struct nvme_queue *nvmeq)
>> 						nvme_del_cq_work_handler);
>> }
>>
>> +static int nvme_enable_async_events(struct nvme_dev *dev)
>> +{
>> +	int status, cmdid;
>> +	u32 result, async_events;
>> +	struct nvme_queue *adminq;
>> +
>> +	async_events = NVME_SMART_CRIT_SPARE |
>> +			NVME_SMART_CRIT_TEMPERATURE |
>> +			NVME_SMART_CRIT_RELIABILITY |
>> +			NVME_SMART_CRIT_MEDIA |
>> +			NVME_SMART_CRIT_VOLATILE_MEMORY;
>> +
>> +	status = nvme_set_features(dev, NVME_FEAT_ASYNC_EVENT,
>> +					async_events, 0, &result);
>
> I think we'd rather let the user pick what events they want to see using
> the passthrough IOCTL rather than have the driver decide these things.

Good idea, I think a sysfs might be better, do you have objection use 
that instead.

>
>> +
>> +	if (status < 0)
>> +		return status;
>> +
>> +	if (status > 0) {
>> +		dev_err(&dev->pci_dev->dev, "Could not enable async event (%d)\n",
>> +									status);
>> +		return -EBUSY;
>> +	}
>> +
>> +	adminq = rcu_dereference(dev->queues[0]);
>> +
>> +	/* Allocate a cmdid entry in preparation of next incoming async event */
>> +	cmdid = alloc_cmdid(adminq, CMD_CTX_ASYNC_EVENT, async_completion, 0);
>
> Same thing as in the completion, you're allocating a cmdid, but no
> command is associated with it.

Ditto here, I knew this will probably require some rework. The basic 
difference between an asynchronous event and regular admin cmd is that 
async event doesn't have a timeout, it can come any time after host 
issues enabling the async event feature, whereas a normal admin cmd will 
get some sort of completion response within certain timeout period.

>
> I don't think you want to use the "async_completion" callback either
> (is it confusing to name that callback that way? :)) unless you have
> some deferred work that needs to be done upon the completion that can't
> be done in interrupt context.
>

I can change to use a different callback name. But using alloc_cmdid 
with a zero timeout and callback may not be the right way for async 
event. Any suggestion is welcome.

>> +	return cmdid;
>> +}
>> +
>> static void nvme_del_sq_work_handler(struct kthread_work *work)
>> {
>> 	struct nvme_queue *nvmeq = container_of(work, struct nvme_queue,
>> @@ -2638,6 +2690,11 @@ static int nvme_dev_start(struct nvme_dev *dev)
>> 		goto disable;
>> 	}
>>
>> +	/* Enable receive asynchronous event */
>> +	result = nvme_enable_async_events(dev);
>> +	if (result < 0 && result != -EBUSY)
>> +		goto disable;
>> +
>> 	result = nvme_setup_io_queues(dev);
>> 	if (result && result != -EBUSY)
>> 		goto disable;

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-26 23:51 ` Matthew Wilcox
  2014-05-27  0:56   ` Keith Busch
@ 2014-05-27  5:15   ` Winson Yung (wyung)
  1 sibling, 0 replies; 11+ messages in thread
From: Winson Yung (wyung) @ 2014-05-27  5:15 UTC (permalink / raw)


On 5/26/2014 4:51 PM, Matthew Wilcox wrote:
> On Mon, May 26, 2014@01:04:55PM -0700, Winson Yung (wyung) wrote:
>> As a NVMe mandatory admin command, this driver should be setup so
>> that it can receive drive critical asynchronous notification for
>> issue such as device reliability, temperature above threshold, or
>> available spare space fallen below threshould. This patch enables
>> very basic mechanism to log the asynchronous events in kernel log.
>
> Umm ... did you test this patch?

I didn't have the time to test the patch yet, perhaps I should mark this 
patch as RFC instead. But yes, I will try to verify when I have a system 
setup.

>
>> Signed-off-by: Winson Yung <wyung at micron.com>
>> ---
>>   drivers/block/nvme-core.c |   57 +++++++++++++++++++++++++++++++++++++++++++++
>>   1 file changed, 57 insertions(+)
>>
>> diff --git a/drivers/block/nvme-core.c b/drivers/block/nvme-core.c
>> index cd8a8bc7..4cd9f8e 100644
>> --- a/drivers/block/nvme-core.c
>> +++ b/drivers/block/nvme-core.c
>> @@ -198,6 +198,7 @@ static int alloc_cmdid_killable(struct nvme_queue *nvmeq, void *ctx,
>>   #define CMD_CTX_COMPLETED	(0x310 + CMD_CTX_BASE)
>>   #define CMD_CTX_INVALID		(0x314 + CMD_CTX_BASE)
>>   #define CMD_CTX_ABORT		(0x318 + CMD_CTX_BASE)
>> +#define CMD_CTX_ASYNC_EVENT	(0x319 + CMD_CTX_BASE)
>
> Please only use multiples of four; that is, 0x31c, not 0x319.  Also, these
> are for use by 'special_completion', not 'async_completion'.
>

Understood about the multiple of four thingy, I will fix it. I will 
change the name to avoid confusion if I can still use async_completion.

>> +static int nvme_enable_async_events(struct nvme_dev *dev)
>> +{
>> +	int status, cmdid;
>> +	u32 result, async_events;
>> +	struct nvme_queue *adminq;
>> +
>> +	async_events = NVME_SMART_CRIT_SPARE |
>> +			NVME_SMART_CRIT_TEMPERATURE |
>> +			NVME_SMART_CRIT_RELIABILITY |
>> +			NVME_SMART_CRIT_MEDIA |
>> +			NVME_SMART_CRIT_VOLATILE_MEMORY;
>> +
>> +	status = nvme_set_features(dev, NVME_FEAT_ASYNC_EVENT,
>> +					async_events, 0, &result);
>> +
>> +	if (status < 0)
>> +		return status;
>> +
>> +	if (status > 0) {
>> +		dev_err(&dev->pci_dev->dev, "Could not enable async event (%d)\n",
>> +									status);
>> +		return -EBUSY;
>> +	}
>> +
>> +	adminq = rcu_dereference(dev->queues[0]);
>> +
>> +	/* Allocate a cmdid entry in preparation of next incoming async event */
>> +	cmdid = alloc_cmdid(adminq, CMD_CTX_ASYNC_EVENT, async_completion, 0);
>> +	return cmdid;
>> +}
>
> How is this supposed to work?  You've allocated a command ID, but you
> haven't submitted an asynchronous event request command.  So how does
> the controller know to use this command ID to report asynchronous events?
>

Please see my reply to Keith's email, perhaps my assumption was wrong.

> You should probably take a look at Keith's work last year to allow userspace
> to send async event requests:
>
> http://lists.infradead.org/pipermail/linux-nvme/2013-August/000350.html
>

Thanks for the link, I wasn't aware of that. I will take a look.

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-27  0:56   ` Keith Busch
@ 2014-05-27  5:35     ` Winson Yung (wyung)
  2014-05-27  5:50       ` Keith Busch
  2014-05-28 20:35     ` Winson Yung (wyung)
  1 sibling, 1 reply; 11+ messages in thread
From: Winson Yung (wyung) @ 2014-05-27  5:35 UTC (permalink / raw)



Keith, I do see a need to enable async event in the NVMe kernel driver. 
For example, when there is a temperature above threshold, driver can 
take an action (by telling firmware) to lower down operating frequency, 
or throttle IO request to protect drive from premature over heat damage.

/Winson

On 5/26/2014 5:56 PM, Keith Busch wrote:
> On Mon, 26 May 2014, Matthew Wilcox wrote:
>> You should probably take a look at Keith's work last year to allow userspace
>> to send async event requests:
>>
>> http://lists.infradead.org/pipermail/linux-nvme/2013-August/000350.html
>
> Yeah, that proposal just lets userspace consume the results of an async
> request from a FIFO read through the character device. The driver still
> has to do the sending since there's no mechanism for requests from user
> space with infinite timeout.
>
> I've no idea if the proposed method for consuming results of this kind
> of information was typical. I assumed it wasn't since it didn't get much
> traction. :)
>

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-27  5:35     ` Winson Yung (wyung)
@ 2014-05-27  5:50       ` Keith Busch
  2014-05-27  6:56         ` Robles, Raymond C
  0 siblings, 1 reply; 11+ messages in thread
From: Keith Busch @ 2014-05-27  5:50 UTC (permalink / raw)

On Mon, 26 May 2014, Winson Yung (wyung) wrote:
> Keith, I do see a need to enable async event in the NVMe kernel driver. For 
> example, when there is a temperature above threshold, driver can take an 
> action (by telling firmware) to lower down operating frequency, or throttle 
> IO request to protect drive from premature over heat damage.

This is sounding specific to your environment. What's a good policy
for yours might not be a good policy for mine. Why would I want the
driver to throttle frequency when I have better environmental control
options available? The right thing to do, IMHO, is make all information
available to a user space app and provide a way for it to control the
device according to a policy it knows.

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-27  5:50       ` Keith Busch
@ 2014-05-27  6:56         ` Robles, Raymond C
  0 siblings, 0 replies; 11+ messages in thread
From: Robles, Raymond C @ 2014-05-27  6:56 UTC (permalink / raw)

This is exactly what the Windows OFA NVMe open source driver does as well. The driver does not, and should not, have knowledge as to what the "right temperature threshold" is or how many "I/O to throttle" in any kind of situation, good or bad. The NVMe device/controller parameters and policy should be set and handled (proactively and reactively) by the device vendor and any 3rd party user space application, either from the vendor or some other trusted OEM source. 

-----Original Message-----
From: Linux-nvme [mailto:linux-nvme-bounces@lists.infradead.org] On Behalf Of Keith Busch
Sent: Monday, May 26, 2014 10:51 PM
To: Winson Yung (wyung)
Cc: Busch, Keith; Matthew Wilcox; linux-nvme at lists.infradead.org
Subject: Re: [PATCH] NVMe: Add support to receive NVMe asynchronous events

On Mon, 26 May 2014, Winson Yung (wyung) wrote:
> Keith, I do see a need to enable async event in the NVMe kernel 
> driver. For example, when there is a temperature above threshold, 
> driver can take an action (by telling firmware) to lower down 
> operating frequency, or throttle IO request to protect drive from premature over heat damage.

This is sounding specific to your environment. What's a good policy for yours might not be a good policy for mine. Why would I want the driver to throttle frequency when I have better environmental control options available? The right thing to do, IMHO, is make all information available to a user space app and provide a way for it to control the device according to a policy it knows.

_______________________________________________
Linux-nvme mailing list
Linux-nvme at lists.infradead.org
http://lists.infradead.org/mailman/listinfo/linux-nvme

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-27  0:56   ` Keith Busch
  2014-05-27  5:35     ` Winson Yung (wyung)
@ 2014-05-28 20:35     ` Winson Yung (wyung)
  2014-05-29  6:40       ` Keith Busch
  1 sibling, 1 reply; 11+ messages in thread
From: Winson Yung (wyung) @ 2014-05-28 20:35 UTC (permalink / raw)


I had a look of the patch, it looks it does what I was trying to enable, 
except it misses the portion that enables it by calling set feature cmd. 
Is it something we can consider now? Also, for these critical warnings 
that exposed by the async events, can we also put them in the kernel log 
as well when they enabled?

/Winson

On 5/26/2014 5:56 PM, Keith Busch wrote:
> On Mon, 26 May 2014, Matthew Wilcox wrote:
>> You should probably take a look at Keith's work last year to allow userspace
>> to send async event requests:
>>
>> http://lists.infradead.org/pipermail/linux-nvme/2013-August/000350.html
>
> Yeah, that proposal just lets userspace consume the results of an async
> request from a FIFO read through the character device. The driver still
> has to do the sending since there's no mechanism for requests from user
> space with infinite timeout.
>
> I've no idea if the proposed method for consuming results of this kind
> of information was typical. I assumed it wasn't since it didn't get much
> traction. :)
>

^ permalink raw reply	[flat|nested] 11+ messages in thread

* [PATCH] NVMe: Add support to receive NVMe asynchronous events
  2014-05-28 20:35     ` Winson Yung (wyung)
@ 2014-05-29  6:40       ` Keith Busch
  0 siblings, 0 replies; 11+ messages in thread
From: Keith Busch @ 2014-05-29  6:40 UTC (permalink / raw)


On Wed, 28 May 2014, Winson Yung (wyung) wrote:
> I had a look of the patch, it looks it does what I was trying to enable, 
> except it misses the portion that enables it by calling set feature cmd. Is 
> it something we can consider now? Also, for these critical warnings that 
> exposed by the async events, can we also put them in the kernel log as well 
> when they enabled?

I thought we agreed it's best to let the user space do the set features
so it gets to decide what events it wants to see.

I don't have a strong opinion on how to present events to the user. Maybe
just print them to the kernel log and be done with it.

^ permalink raw reply	[flat|nested] 11+ messages in thread

end of thread, other threads:[~2014-05-29  6:40 UTC | newest]

Thread overview: 11+ messages (download: mbox.gz follow: Atom feed
-- links below jump to the message on this page --
2014-05-26 20:04 [PATCH] NVMe: Add support to receive NVMe asynchronous events Winson Yung (wyung)
2014-05-26 21:42 ` Keith Busch
2014-05-27  5:02   ` Winson Yung (wyung)
2014-05-26 23:51 ` Matthew Wilcox
2014-05-27  0:56   ` Keith Busch
2014-05-27  5:35     ` Winson Yung (wyung)
2014-05-27  5:50       ` Keith Busch
2014-05-27  6:56         ` Robles, Raymond C
2014-05-28 20:35     ` Winson Yung (wyung)
2014-05-29  6:40       ` Keith Busch
2014-05-27  5:15   ` Winson Yung (wyung)

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox