* [PATCH v13 1/4] PCI/DOE: Rename DOE protocol to feature
@ 2024-07-02 6:04 Alistair Francis
2024-07-02 6:04 ` [PATCH v13 2/4] PCI/DOE: Rename Discovery Response Data Object Contents to type Alistair Francis
` (2 more replies)
0 siblings, 3 replies; 10+ messages in thread
From: Alistair Francis @ 2024-07-02 6:04 UTC (permalink / raw)
To: bhelgaas, linux-pci, Jonathan.Cameron, lukas
Cc: alex.williamson, christian.koenig, kch, gregkh, logang,
linux-kernel, alistair23, chaitanyak, rdunlap, Alistair Francis
DOE r1.1 replaced all occurrences of "protocol" with the term "feature"
or "Data Object Type".
PCIe r6.1 (which was published July 24) incorporated that change.
Rename the existing term "protocol" to "feature".
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
Reviewed-by: Jonathan Cameron <Jonathan.Cameron@huawei.com>
Reviewed-by: Lukas Wunner <lukas@wunner.de>
---
v13:
- No changes
v12:
- No changes
v11:
- No changes
v10:
- Split original patch into two
v9:
- Rename two more DOE macros
v8:
- Rename prot to feat as well
v7:
- Initial patch
drivers/pci/doe.c | 88 +++++++++++++++++++++++------------------------
1 file changed, 44 insertions(+), 44 deletions(-)
diff --git a/drivers/pci/doe.c b/drivers/pci/doe.c
index 652d63df9d22..f776f5304a3e 100644
--- a/drivers/pci/doe.c
+++ b/drivers/pci/doe.c
@@ -22,7 +22,7 @@
#include "pci.h"
-#define PCI_DOE_PROTOCOL_DISCOVERY 0
+#define PCI_DOE_FEATURE_DISCOVERY 0
/* Timeout of 1 second from 6.30.2 Operation, PCI Spec r6.0 */
#define PCI_DOE_TIMEOUT HZ
@@ -43,7 +43,7 @@
*
* @pdev: PCI device this mailbox belongs to
* @cap_offset: Capability offset
- * @prots: Array of protocols supported (encoded as long values)
+ * @feats: Array of features supported (encoded as long values)
* @wq: Wait queue for work item
* @work_queue: Queue of pci_doe_work items
* @flags: Bit array of PCI_DOE_FLAG_* flags
@@ -51,14 +51,14 @@
struct pci_doe_mb {
struct pci_dev *pdev;
u16 cap_offset;
- struct xarray prots;
+ struct xarray feats;
wait_queue_head_t wq;
struct workqueue_struct *work_queue;
unsigned long flags;
};
-struct pci_doe_protocol {
+struct pci_doe_feature {
u16 vid;
u8 type;
};
@@ -66,7 +66,7 @@ struct pci_doe_protocol {
/**
* struct pci_doe_task - represents a single query/response
*
- * @prot: DOE Protocol
+ * @feat: DOE Feature
* @request_pl: The request payload
* @request_pl_sz: Size of the request payload (bytes)
* @response_pl: The response payload
@@ -78,7 +78,7 @@ struct pci_doe_protocol {
* @doe_mb: Used internally by the mailbox
*/
struct pci_doe_task {
- struct pci_doe_protocol prot;
+ struct pci_doe_feature feat;
const __le32 *request_pl;
size_t request_pl_sz;
__le32 *response_pl;
@@ -171,8 +171,8 @@ static int pci_doe_send_req(struct pci_doe_mb *doe_mb,
length = 0;
/* Write DOE Header */
- val = FIELD_PREP(PCI_DOE_DATA_OBJECT_HEADER_1_VID, task->prot.vid) |
- FIELD_PREP(PCI_DOE_DATA_OBJECT_HEADER_1_TYPE, task->prot.type);
+ val = FIELD_PREP(PCI_DOE_DATA_OBJECT_HEADER_1_VID, task->feat.vid) |
+ FIELD_PREP(PCI_DOE_DATA_OBJECT_HEADER_1_TYPE, task->feat.type);
pci_write_config_dword(pdev, offset + PCI_DOE_WRITE, val);
pci_write_config_dword(pdev, offset + PCI_DOE_WRITE,
FIELD_PREP(PCI_DOE_DATA_OBJECT_HEADER_2_LENGTH,
@@ -217,12 +217,12 @@ static int pci_doe_recv_resp(struct pci_doe_mb *doe_mb, struct pci_doe_task *tas
int i = 0;
u32 val;
- /* Read the first dword to get the protocol */
+ /* Read the first dword to get the feature */
pci_read_config_dword(pdev, offset + PCI_DOE_READ, &val);
- if ((FIELD_GET(PCI_DOE_DATA_OBJECT_HEADER_1_VID, val) != task->prot.vid) ||
- (FIELD_GET(PCI_DOE_DATA_OBJECT_HEADER_1_TYPE, val) != task->prot.type)) {
- dev_err_ratelimited(&pdev->dev, "[%x] expected [VID, Protocol] = [%04x, %02x], got [%04x, %02x]\n",
- doe_mb->cap_offset, task->prot.vid, task->prot.type,
+ if ((FIELD_GET(PCI_DOE_DATA_OBJECT_HEADER_1_VID, val) != task->feat.vid) ||
+ (FIELD_GET(PCI_DOE_DATA_OBJECT_HEADER_1_TYPE, val) != task->feat.type)) {
+ dev_err_ratelimited(&pdev->dev, "[%x] expected [VID, Feature] = [%04x, %02x], got [%04x, %02x]\n",
+ doe_mb->cap_offset, task->feat.vid, task->feat.type,
FIELD_GET(PCI_DOE_DATA_OBJECT_HEADER_1_VID, val),
FIELD_GET(PCI_DOE_DATA_OBJECT_HEADER_1_TYPE, val));
return -EIO;
@@ -384,7 +384,7 @@ static void pci_doe_task_complete(struct pci_doe_task *task)
}
static int pci_doe_discovery(struct pci_doe_mb *doe_mb, u8 capver, u8 *index, u16 *vid,
- u8 *protocol)
+ u8 *feature)
{
u32 request_pl = FIELD_PREP(PCI_DOE_DATA_OBJECT_DISC_REQ_3_INDEX,
*index) |
@@ -395,7 +395,7 @@ static int pci_doe_discovery(struct pci_doe_mb *doe_mb, u8 capver, u8 *index, u1
u32 response_pl;
int rc;
- rc = pci_doe(doe_mb, PCI_VENDOR_ID_PCI_SIG, PCI_DOE_PROTOCOL_DISCOVERY,
+ rc = pci_doe(doe_mb, PCI_VENDOR_ID_PCI_SIG, PCI_DOE_FEATURE_DISCOVERY,
&request_pl_le, sizeof(request_pl_le),
&response_pl_le, sizeof(response_pl_le));
if (rc < 0)
@@ -406,7 +406,7 @@ static int pci_doe_discovery(struct pci_doe_mb *doe_mb, u8 capver, u8 *index, u1
response_pl = le32_to_cpu(response_pl_le);
*vid = FIELD_GET(PCI_DOE_DATA_OBJECT_DISC_RSP_3_VID, response_pl);
- *protocol = FIELD_GET(PCI_DOE_DATA_OBJECT_DISC_RSP_3_PROTOCOL,
+ *feature = FIELD_GET(PCI_DOE_DATA_OBJECT_DISC_RSP_3_PROTOCOL,
response_pl);
*index = FIELD_GET(PCI_DOE_DATA_OBJECT_DISC_RSP_3_NEXT_INDEX,
response_pl);
@@ -414,12 +414,12 @@ static int pci_doe_discovery(struct pci_doe_mb *doe_mb, u8 capver, u8 *index, u1
return 0;
}
-static void *pci_doe_xa_prot_entry(u16 vid, u8 prot)
+static void *pci_doe_xa_feat_entry(u16 vid, u8 prot)
{
return xa_mk_value((vid << 8) | prot);
}
-static int pci_doe_cache_protocols(struct pci_doe_mb *doe_mb)
+static int pci_doe_cache_features(struct pci_doe_mb *doe_mb)
{
u8 index = 0;
u8 xa_idx = 0;
@@ -438,11 +438,11 @@ static int pci_doe_cache_protocols(struct pci_doe_mb *doe_mb)
return rc;
pci_dbg(doe_mb->pdev,
- "[%x] Found protocol %d vid: %x prot: %x\n",
+ "[%x] Found feature %d vid: %x prot: %x\n",
doe_mb->cap_offset, xa_idx, vid, prot);
- rc = xa_insert(&doe_mb->prots, xa_idx++,
- pci_doe_xa_prot_entry(vid, prot), GFP_KERNEL);
+ rc = xa_insert(&doe_mb->feats, xa_idx++,
+ pci_doe_xa_feat_entry(vid, prot), GFP_KERNEL);
if (rc)
return rc;
} while (index);
@@ -466,7 +466,7 @@ static void pci_doe_cancel_tasks(struct pci_doe_mb *doe_mb)
* @pdev: PCI device to create the DOE mailbox for
* @cap_offset: Offset of the DOE mailbox
*
- * Create a single mailbox object to manage the mailbox protocol at the
+ * Create a single mailbox object to manage the mailbox feature at the
* cap_offset specified.
*
* RETURNS: created mailbox object on success
@@ -485,7 +485,7 @@ static struct pci_doe_mb *pci_doe_create_mb(struct pci_dev *pdev,
doe_mb->pdev = pdev;
doe_mb->cap_offset = cap_offset;
init_waitqueue_head(&doe_mb->wq);
- xa_init(&doe_mb->prots);
+ xa_init(&doe_mb->feats);
doe_mb->work_queue = alloc_ordered_workqueue("%s %s DOE [%x]", 0,
dev_bus_name(&pdev->dev),
@@ -508,11 +508,11 @@ static struct pci_doe_mb *pci_doe_create_mb(struct pci_dev *pdev,
/*
* The state machine and the mailbox should be in sync now;
- * Use the mailbox to query protocols.
+ * Use the mailbox to query features.
*/
- rc = pci_doe_cache_protocols(doe_mb);
+ rc = pci_doe_cache_features(doe_mb);
if (rc) {
- pci_err(pdev, "[%x] failed to cache protocols : %d\n",
+ pci_err(pdev, "[%x] failed to cache features : %d\n",
doe_mb->cap_offset, rc);
goto err_cancel;
}
@@ -521,7 +521,7 @@ static struct pci_doe_mb *pci_doe_create_mb(struct pci_dev *pdev,
err_cancel:
pci_doe_cancel_tasks(doe_mb);
- xa_destroy(&doe_mb->prots);
+ xa_destroy(&doe_mb->feats);
err_destroy_wq:
destroy_workqueue(doe_mb->work_queue);
err_free:
@@ -539,31 +539,31 @@ static struct pci_doe_mb *pci_doe_create_mb(struct pci_dev *pdev,
static void pci_doe_destroy_mb(struct pci_doe_mb *doe_mb)
{
pci_doe_cancel_tasks(doe_mb);
- xa_destroy(&doe_mb->prots);
+ xa_destroy(&doe_mb->feats);
destroy_workqueue(doe_mb->work_queue);
kfree(doe_mb);
}
/**
- * pci_doe_supports_prot() - Return if the DOE instance supports the given
- * protocol
+ * pci_doe_supports_feat() - Return if the DOE instance supports the given
+ * feature
* @doe_mb: DOE mailbox capability to query
- * @vid: Protocol Vendor ID
- * @type: Protocol type
+ * @vid: Feature Vendor ID
+ * @type: Feature type
*
- * RETURNS: True if the DOE mailbox supports the protocol specified
+ * RETURNS: True if the DOE mailbox supports the feature specified
*/
-static bool pci_doe_supports_prot(struct pci_doe_mb *doe_mb, u16 vid, u8 type)
+static bool pci_doe_supports_feat(struct pci_doe_mb *doe_mb, u16 vid, u8 type)
{
unsigned long index;
void *entry;
- /* The discovery protocol must always be supported */
- if (vid == PCI_VENDOR_ID_PCI_SIG && type == PCI_DOE_PROTOCOL_DISCOVERY)
+ /* The discovery feature must always be supported */
+ if (vid == PCI_VENDOR_ID_PCI_SIG && type == PCI_DOE_FEATURE_DISCOVERY)
return true;
- xa_for_each(&doe_mb->prots, index, entry)
- if (entry == pci_doe_xa_prot_entry(vid, type))
+ xa_for_each(&doe_mb->feats, index, entry)
+ if (entry == pci_doe_xa_feat_entry(vid, type))
return true;
return false;
@@ -591,7 +591,7 @@ static bool pci_doe_supports_prot(struct pci_doe_mb *doe_mb, u16 vid, u8 type)
static int pci_doe_submit_task(struct pci_doe_mb *doe_mb,
struct pci_doe_task *task)
{
- if (!pci_doe_supports_prot(doe_mb, task->prot.vid, task->prot.type))
+ if (!pci_doe_supports_feat(doe_mb, task->feat.vid, task->feat.type))
return -EINVAL;
if (test_bit(PCI_DOE_FLAG_DEAD, &doe_mb->flags))
@@ -637,8 +637,8 @@ int pci_doe(struct pci_doe_mb *doe_mb, u16 vendor, u8 type,
{
DECLARE_COMPLETION_ONSTACK(c);
struct pci_doe_task task = {
- .prot.vid = vendor,
- .prot.type = type,
+ .feat.vid = vendor,
+ .feat.type = type,
.request_pl = request,
.request_pl_sz = request_sz,
.response_pl = response,
@@ -663,9 +663,9 @@ EXPORT_SYMBOL_GPL(pci_doe);
*
* @pdev: PCI device
* @vendor: Vendor ID
- * @type: Data Object Type
+ * @prot: Data Object Type
*
- * Find first DOE mailbox of a PCI device which supports the given protocol.
+ * Find first DOE mailbox of a PCI device which supports the given feature.
*
* RETURNS: Pointer to the DOE mailbox or NULL if none was found.
*/
@@ -676,7 +676,7 @@ struct pci_doe_mb *pci_find_doe_mailbox(struct pci_dev *pdev, u16 vendor,
unsigned long index;
xa_for_each(&pdev->doe_mbs, index, doe_mb)
- if (pci_doe_supports_prot(doe_mb, vendor, type))
+ if (pci_doe_supports_feat(doe_mb, vendor, type))
return doe_mb;
return NULL;
--
2.45.2
^ permalink raw reply related [flat|nested] 10+ messages in thread
* [PATCH v13 2/4] PCI/DOE: Rename Discovery Response Data Object Contents to type
2024-07-02 6:04 [PATCH v13 1/4] PCI/DOE: Rename DOE protocol to feature Alistair Francis
@ 2024-07-02 6:04 ` Alistair Francis
2024-07-02 6:04 ` [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs Alistair Francis
2024-07-02 6:04 ` [PATCH v13 4/4] PCI/DOE: Allow enabling DOE without CXL Alistair Francis
2 siblings, 0 replies; 10+ messages in thread
From: Alistair Francis @ 2024-07-02 6:04 UTC (permalink / raw)
To: bhelgaas, linux-pci, Jonathan.Cameron, lukas
Cc: alex.williamson, christian.koenig, kch, gregkh, logang,
linux-kernel, alistair23, chaitanyak, rdunlap, Alistair Francis
PCIe r6.1 (which was published July 24) describes a "Vendor ID", a
"Data Object Type" and "Next Index" as the fields in the DOE
Discovery Response Data Object. The DOE driver currently uses
both the terms type and prot for the second element.
This patch renames all uses of the DOE Discovery Response Data Object
to use type as the second element of the object header, instead of
type/prot as it currently is.
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
Reviewed-by: Jonathan Cameron <Jonathan.Cameron@huawei.com>
---
v13
- No changes
v12:
- Use PCI_DOE_DATA_OBJECT_DISC_RSP_3_TYPE for PCI_DOE_DATA_OBJECT_DISC_RSP_3_PROTOCOL
v11:
- Avoid breaking changes to userspace header
v10:
- Split original patch into two
v9:
- Rename two more DOE macros
v8:
- Rename prot to feat as well
v7:
- Initial patch
drivers/pci/doe.c | 18 +++++++++---------
include/uapi/linux/pci_regs.h | 5 ++++-
2 files changed, 13 insertions(+), 10 deletions(-)
diff --git a/drivers/pci/doe.c b/drivers/pci/doe.c
index f776f5304a3e..defc4be81bd4 100644
--- a/drivers/pci/doe.c
+++ b/drivers/pci/doe.c
@@ -406,7 +406,7 @@ static int pci_doe_discovery(struct pci_doe_mb *doe_mb, u8 capver, u8 *index, u1
response_pl = le32_to_cpu(response_pl_le);
*vid = FIELD_GET(PCI_DOE_DATA_OBJECT_DISC_RSP_3_VID, response_pl);
- *feature = FIELD_GET(PCI_DOE_DATA_OBJECT_DISC_RSP_3_PROTOCOL,
+ *feature = FIELD_GET(PCI_DOE_DATA_OBJECT_DISC_RSP_3_TYPE,
response_pl);
*index = FIELD_GET(PCI_DOE_DATA_OBJECT_DISC_RSP_3_NEXT_INDEX,
response_pl);
@@ -414,9 +414,9 @@ static int pci_doe_discovery(struct pci_doe_mb *doe_mb, u8 capver, u8 *index, u1
return 0;
}
-static void *pci_doe_xa_feat_entry(u16 vid, u8 prot)
+static void *pci_doe_xa_feat_entry(u16 vid, u8 type)
{
- return xa_mk_value((vid << 8) | prot);
+ return xa_mk_value((vid << 8) | type);
}
static int pci_doe_cache_features(struct pci_doe_mb *doe_mb)
@@ -430,19 +430,19 @@ static int pci_doe_cache_features(struct pci_doe_mb *doe_mb)
do {
int rc;
u16 vid;
- u8 prot;
+ u8 type;
rc = pci_doe_discovery(doe_mb, PCI_EXT_CAP_VER(hdr), &index,
- &vid, &prot);
+ &vid, &type);
if (rc)
return rc;
pci_dbg(doe_mb->pdev,
- "[%x] Found feature %d vid: %x prot: %x\n",
- doe_mb->cap_offset, xa_idx, vid, prot);
+ "[%x] Found feature %d vid: %x type: %x\n",
+ doe_mb->cap_offset, xa_idx, vid, type);
rc = xa_insert(&doe_mb->feats, xa_idx++,
- pci_doe_xa_feat_entry(vid, prot), GFP_KERNEL);
+ pci_doe_xa_feat_entry(vid, type), GFP_KERNEL);
if (rc)
return rc;
} while (index);
@@ -663,7 +663,7 @@ EXPORT_SYMBOL_GPL(pci_doe);
*
* @pdev: PCI device
* @vendor: Vendor ID
- * @prot: Data Object Type
+ * @type: Data Object Type
*
* Find first DOE mailbox of a PCI device which supports the given feature.
*
diff --git a/include/uapi/linux/pci_regs.h b/include/uapi/linux/pci_regs.h
index 94c00996e633..795e49304ae4 100644
--- a/include/uapi/linux/pci_regs.h
+++ b/include/uapi/linux/pci_regs.h
@@ -1146,9 +1146,12 @@
#define PCI_DOE_DATA_OBJECT_DISC_REQ_3_INDEX 0x000000ff
#define PCI_DOE_DATA_OBJECT_DISC_REQ_3_VER 0x0000ff00
#define PCI_DOE_DATA_OBJECT_DISC_RSP_3_VID 0x0000ffff
-#define PCI_DOE_DATA_OBJECT_DISC_RSP_3_PROTOCOL 0x00ff0000
+#define PCI_DOE_DATA_OBJECT_DISC_RSP_3_TYPE 0x00ff0000
#define PCI_DOE_DATA_OBJECT_DISC_RSP_3_NEXT_INDEX 0xff000000
+/* Deprecated old name, replaced with PCI_DOE_DATA_OBJECT_DISC_RSP_3_TYPE */
+#define PCI_DOE_DATA_OBJECT_DISC_RSP_3_PROTOCOL PCI_DOE_DATA_OBJECT_DISC_RSP_3_TYPE
+
/* Compute Express Link (CXL r3.1, sec 8.1.5) */
#define PCI_DVSEC_CXL_PORT 3
#define PCI_DVSEC_CXL_PORT_CTL 0x0c
--
2.45.2
^ permalink raw reply related [flat|nested] 10+ messages in thread
* [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs
2024-07-02 6:04 [PATCH v13 1/4] PCI/DOE: Rename DOE protocol to feature Alistair Francis
2024-07-02 6:04 ` [PATCH v13 2/4] PCI/DOE: Rename Discovery Response Data Object Contents to type Alistair Francis
@ 2024-07-02 6:04 ` Alistair Francis
2024-07-02 11:57 ` Chaitanya Kulkarni
2024-07-02 13:58 ` Jonathan Cameron
2024-07-02 6:04 ` [PATCH v13 4/4] PCI/DOE: Allow enabling DOE without CXL Alistair Francis
2 siblings, 2 replies; 10+ messages in thread
From: Alistair Francis @ 2024-07-02 6:04 UTC (permalink / raw)
To: bhelgaas, linux-pci, Jonathan.Cameron, lukas
Cc: alex.williamson, christian.koenig, kch, gregkh, logang,
linux-kernel, alistair23, chaitanyak, rdunlap, Alistair Francis
The PCIe 6 specification added support for the Data Object
Exchange (DOE).
When DOE is supported the DOE Discovery Feature must be implemented per
PCIe r6.1 sec 6.30.1.1. The protocol allows a requester to obtain
information about the other DOE features supported by the device.
The kernel is already querying the DOE features supported and caching
the values. Expose the values in sysfs to allow user space to
determine which DOE features are supported by the PCIe device.
By exposing the information to userspace, tools like lspci can relay the
information to users. By listing all of the supported features we can
allow userspace to parse the list, which might include
vendor specific features as well as yet to be supported features.
After this patch is applied you can see something like this when
attaching a DOE device:
$ ls /sys/devices/pci0000:00/0000:00:02.0//doe*
0001:00 0001:01 0001:02
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
---
v13:
- Drop pci_doe_sysfs_init() and use pci_doe_sysfs_group
- As discussed in https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
we can just modify pci_doe_sysfs_group at the DOE init and let
device_add() handle the sysfs attributes.
v12:
- Drop pci_doe_features_sysfs_attr_visible()
v11:
- Gracefully handle multiple entries of the same feature
- Minor fixes and code cleanups
v10:
- Rebase to use DEFINE_SYSFS_GROUP_VISIBLE and remove
special setup function
v9:
- Add a teardown function
- Rename functions to be clearer
- Tidy up the commit message
- Remove #ifdef from header
v8:
- Include an example in the docs
- Fixup removing a file that wasn't added
- Remove a blank line
v7:
- Fixup the #ifdefs to keep the test robot happy
v6:
- Use "feature" instead of protocol
- Don't use any devm_* functions
- Add two more patches to the series
v5:
- Return the file name as the file contents
- Code cleanups and simplifications
v4:
- Fixup typos in the documentation
- Make it clear that the file names contain the information
- Small code cleanups
- Remove most #ifdefs
- Remove extra NULL assignment
v3:
- Expose each DOE feature as a separate file
v2:
- Add documentation
- Code cleanups
Documentation/ABI/testing/sysfs-bus-pci | 28 ++++++
drivers/pci/doe.c | 109 +++++++++++++++++++++++-
drivers/pci/pci-sysfs.c | 4 +
drivers/pci/pci.h | 2 +
4 files changed, 142 insertions(+), 1 deletion(-)
diff --git a/Documentation/ABI/testing/sysfs-bus-pci b/Documentation/ABI/testing/sysfs-bus-pci
index ecf47559f495..e1b8f15e4a3a 100644
--- a/Documentation/ABI/testing/sysfs-bus-pci
+++ b/Documentation/ABI/testing/sysfs-bus-pci
@@ -500,3 +500,31 @@ Description:
console drivers from the device. Raw users of pci-sysfs
resourceN attributes must be terminated prior to resizing.
Success of the resizing operation is not guaranteed.
+
+What: /sys/bus/pci/devices/.../doe_features
+Date: July 2024
+Contact: Linux PCI developers <linux-pci@vger.kernel.org>
+Description:
+ This directory contains a list of the supported
+ Data Object Exchange (DOE) features. The feature values are
+ the file name. The contents of each file are the raw vendor id and
+ data object feature values, the same as the name.
+
+ The value comes from the device and specifies the vendor and
+ data object type supported. The lower (RHS of the colon) is
+ the data object type in hex. The upper (LHS of the colon)
+ is the vendor ID.
+
+ As all DOE devices must support the DOE discovery feature, if
+ DOE is supported you will at least see this file, with
+ these contents
+
+ # cat doe_features/0001:00
+ 0001:00
+
+ If the device supports other features you will see other files
+ as well. For example, if CMA/SPDM and secure CMA/SPDM are supported
+ the doe_features directory will look like this
+
+ # ls doe_features
+ 0001:00 0001:01 0001:02
diff --git a/drivers/pci/doe.c b/drivers/pci/doe.c
index defc4be81bd4..e7b702afce88 100644
--- a/drivers/pci/doe.c
+++ b/drivers/pci/doe.c
@@ -14,6 +14,7 @@
#include <linux/bitfield.h>
#include <linux/delay.h>
+#include <linux/device.h>
#include <linux/jiffies.h>
#include <linux/mutex.h>
#include <linux/pci.h>
@@ -47,6 +48,8 @@
* @wq: Wait queue for work item
* @work_queue: Queue of pci_doe_work items
* @flags: Bit array of PCI_DOE_FLAG_* flags
+ * @device_attrs: Array of device attributes, used in cleanup
+ * @sysfs_attrs: Array of sysfs attributes, used in cleanup
*/
struct pci_doe_mb {
struct pci_dev *pdev;
@@ -56,6 +59,11 @@ struct pci_doe_mb {
wait_queue_head_t wq;
struct workqueue_struct *work_queue;
unsigned long flags;
+
+#ifdef CONFIG_SYSFS
+ struct device_attribute *device_attrs;
+ struct attribute **sysfs_attrs;
+#endif
};
struct pci_doe_feature {
@@ -92,6 +100,58 @@ struct pci_doe_task {
struct pci_doe_mb *doe_mb;
};
+#ifdef CONFIG_SYSFS
+static bool pci_doe_features_sysfs_group_visible(struct kobject *kobj)
+{
+ struct pci_dev *pdev = to_pci_dev(kobj_to_dev(kobj));
+ struct pci_doe_mb *doe_mb;
+ unsigned long index;
+
+ xa_for_each(&pdev->doe_mbs, index, doe_mb) {
+ if (!xa_empty(&doe_mb->feats))
+ return true;
+ }
+
+ return false;
+}
+DEFINE_SIMPLE_SYSFS_GROUP_VISIBLE(pci_doe_features_sysfs)
+
+struct attribute_group pci_doe_sysfs_group = {
+ .name = "doe_features",
+ .is_visible = SYSFS_GROUP_VISIBLE(pci_doe_features_sysfs),
+};
+
+static ssize_t pci_doe_sysfs_feature_show(struct device *dev,
+ struct device_attribute *attr,
+ char *buf)
+{
+ return sysfs_emit(buf, "%s\n", attr->attr.name);
+}
+
+static void pci_doe_sysfs_feature_remove(struct pci_dev *pdev,
+ struct pci_doe_mb *doe_mb)
+{
+ struct device_attribute *attrs = doe_mb->device_attrs;
+ struct attribute **sysfs_attrs = doe_mb->sysfs_attrs;
+ unsigned long i;
+ void *entry;
+
+ if (!attrs)
+ return;
+
+ doe_mb->device_attrs = NULL;
+ doe_mb->sysfs_attrs = NULL;
+
+ xa_for_each(&doe_mb->feats, i, entry) {
+ if (attrs[i].attr.name)
+ kfree(attrs[i].attr.name);
+ }
+
+ kfree(attrs);
+ kfree(sysfs_attrs);
+}
+#endif
+
static int pci_doe_wait(struct pci_doe_mb *doe_mb, unsigned long timeout)
{
if (wait_event_timeout(doe_mb->wq,
@@ -687,6 +747,12 @@ void pci_doe_init(struct pci_dev *pdev)
{
struct pci_doe_mb *doe_mb;
u16 offset = 0;
+ struct attribute **sysfs_attrs;
+ struct device_attribute *attrs;
+ unsigned long num_features = 0;
+ unsigned long i;
+ unsigned long vid, type;
+ void *entry;
int rc;
xa_init(&pdev->doe_mbs);
@@ -707,6 +773,45 @@ void pci_doe_init(struct pci_dev *pdev)
pci_doe_destroy_mb(doe_mb);
}
}
+
+ if (doe_mb) {
+ xa_for_each(&doe_mb->feats, i, entry)
+ num_features++;
+
+ sysfs_attrs = kcalloc(num_features + 1, sizeof(*sysfs_attrs), GFP_KERNEL);
+ if (!sysfs_attrs)
+ return;
+
+ attrs = kcalloc(num_features, sizeof(*attrs), GFP_KERNEL);
+ if (!attrs) {
+ kfree(sysfs_attrs);
+ return;
+ }
+
+ doe_mb->device_attrs = attrs;
+ doe_mb->sysfs_attrs = sysfs_attrs;
+
+ xa_for_each(&doe_mb->feats, i, entry) {
+ sysfs_attr_init(&attrs[i].attr);
+
+ vid = xa_to_value(entry) >> 8;
+ type = xa_to_value(entry) & 0xFF;
+
+ attrs[i].attr.name = kasprintf(GFP_KERNEL, "%04lx:%02lx", vid, type);
+ if (!attrs[i].attr.name) {
+ pci_doe_sysfs_feature_remove(pdev, doe_mb);
+ return;
+ }
+ attrs[i].attr.mode = 0444;
+ attrs[i].show = pci_doe_sysfs_feature_show;
+
+ sysfs_attrs[i] = &attrs[i].attr;
+ }
+
+ sysfs_attrs[num_features] = NULL;
+
+ pci_doe_sysfs_group.attrs = sysfs_attrs;
+ }
}
void pci_doe_destroy(struct pci_dev *pdev)
@@ -714,8 +819,10 @@ void pci_doe_destroy(struct pci_dev *pdev)
struct pci_doe_mb *doe_mb;
unsigned long index;
- xa_for_each(&pdev->doe_mbs, index, doe_mb)
+ xa_for_each(&pdev->doe_mbs, index, doe_mb) {
+ pci_doe_sysfs_feature_remove(pdev, doe_mb);
pci_doe_destroy_mb(doe_mb);
+ }
xa_destroy(&pdev->doe_mbs);
}
diff --git a/drivers/pci/pci-sysfs.c b/drivers/pci/pci-sysfs.c
index 40cfa716392f..cd838b85d6ab 100644
--- a/drivers/pci/pci-sysfs.c
+++ b/drivers/pci/pci-sysfs.c
@@ -16,6 +16,7 @@
#include <linux/kernel.h>
#include <linux/sched.h>
#include <linux/pci.h>
+#include <linux/pci-doe.h>
#include <linux/stat.h>
#include <linux/export.h>
#include <linux/topology.h>
@@ -1661,6 +1662,9 @@ const struct attribute_group *pci_dev_attr_groups[] = {
#endif
#ifdef CONFIG_PCIEASPM
&aspm_ctrl_attr_group,
+#endif
+#ifdef CONFIG_PCI_DOE
+ &pci_doe_sysfs_group,
#endif
NULL,
};
diff --git a/drivers/pci/pci.h b/drivers/pci/pci.h
index fd44565c4756..a26c586cdeb4 100644
--- a/drivers/pci/pci.h
+++ b/drivers/pci/pci.h
@@ -189,6 +189,7 @@ extern const struct attribute_group *pci_dev_groups[];
extern const struct attribute_group *pci_dev_attr_groups[];
extern const struct attribute_group *pcibus_groups[];
extern const struct attribute_group *pci_bus_groups[];
+extern struct attribute_group pci_doe_sysfs_group;
#else
static inline int pci_create_sysfs_dev_files(struct pci_dev *pdev) { return 0; }
static inline void pci_remove_sysfs_dev_files(struct pci_dev *pdev) { }
@@ -196,6 +197,7 @@ static inline void pci_remove_sysfs_dev_files(struct pci_dev *pdev) { }
#define pci_dev_attr_groups NULL
#define pcibus_groups NULL
#define pci_bus_groups NULL
+#define pci_doe_sysfs_group NULL
#endif
extern unsigned long pci_hotplug_io_size;
--
2.45.2
^ permalink raw reply related [flat|nested] 10+ messages in thread
* [PATCH v13 4/4] PCI/DOE: Allow enabling DOE without CXL
2024-07-02 6:04 [PATCH v13 1/4] PCI/DOE: Rename DOE protocol to feature Alistair Francis
2024-07-02 6:04 ` [PATCH v13 2/4] PCI/DOE: Rename Discovery Response Data Object Contents to type Alistair Francis
2024-07-02 6:04 ` [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs Alistair Francis
@ 2024-07-02 6:04 ` Alistair Francis
2 siblings, 0 replies; 10+ messages in thread
From: Alistair Francis @ 2024-07-02 6:04 UTC (permalink / raw)
To: bhelgaas, linux-pci, Jonathan.Cameron, lukas
Cc: alex.williamson, christian.koenig, kch, gregkh, logang,
linux-kernel, alistair23, chaitanyak, rdunlap, Alistair Francis
PCIe devices (not CXL) can support DOE as well, so allow DOE to be
enabled even if CXL isn't.
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
Reviewed-by: Jonathan Cameron <Jonathan.Cameron@huawei.com>
---
drivers/pci/Kconfig | 5 ++++-
1 file changed, 4 insertions(+), 1 deletion(-)
diff --git a/drivers/pci/Kconfig b/drivers/pci/Kconfig
index d35001589d88..09d3f5c8555c 100644
--- a/drivers/pci/Kconfig
+++ b/drivers/pci/Kconfig
@@ -122,7 +122,10 @@ config PCI_ATS
bool
config PCI_DOE
- bool
+ bool "Enable PCI Data Object Exchange (DOE) support"
+ help
+ Say Y here if you want to be able to communicate with PCIe DOE
+ mailboxes.
config PCI_ECAM
bool
--
2.45.2
^ permalink raw reply related [flat|nested] 10+ messages in thread
* Re: [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs
2024-07-02 6:04 ` [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs Alistair Francis
@ 2024-07-02 11:57 ` Chaitanya Kulkarni
2024-07-02 13:58 ` Jonathan Cameron
1 sibling, 0 replies; 10+ messages in thread
From: Chaitanya Kulkarni @ 2024-07-02 11:57 UTC (permalink / raw)
To: Alistair Francis, bhelgaas@google.com, linux-pci@vger.kernel.org,
Jonathan.Cameron@huawei.com, lukas@wunner.de
Cc: alex.williamson@redhat.com, christian.koenig@amd.com,
Chaitanya Kulkarni, gregkh@linuxfoundation.org,
logang@deltatee.com, linux-kernel@vger.kernel.org,
rdunlap@infradead.org, Alistair Francis
> @@ -707,6 +773,45 @@ void pci_doe_init(struct pci_dev *pdev)
> pci_doe_destroy_mb(doe_mb);
> }
> }
> +
> + if (doe_mb) {
> + xa_for_each(&doe_mb->feats, i, entry)
> + num_features++;
> +
> + sysfs_attrs = kcalloc(num_features + 1, sizeof(*sysfs_attrs), GFP_KERNEL);
> + if (!sysfs_attrs)
> + return;
> +
> + attrs = kcalloc(num_features, sizeof(*attrs), GFP_KERNEL);
> + if (!attrs) {
> + kfree(sysfs_attrs);
> + return;
> + }
> +
> + doe_mb->device_attrs = attrs;
> + doe_mb->sysfs_attrs = sysfs_attrs;
> +
> + xa_for_each(&doe_mb->feats, i, entry) {
> + sysfs_attr_init(&attrs[i].attr);
> +
> + vid = xa_to_value(entry) >> 8;
> + type = xa_to_value(entry) & 0xFF;
> +
> + attrs[i].attr.name = kasprintf(GFP_KERNEL, "%04lx:%02lx", vid, type);
> + if (!attrs[i].attr.name) {
> + pci_doe_sysfs_feature_remove(pdev, doe_mb);
> + return;
> + }
> + attrs[i].attr.mode = 0444;
> + attrs[i].show = pci_doe_sysfs_feature_show;
> +
> + sysfs_attrs[i] = &attrs[i].attr;
> + }
> +
> + sysfs_attrs[num_features] = NULL;
shouldn't sysfs_attrs[num_features] be already NULL since it's allocated
using kcalloc() ?
> +
> + pci_doe_sysfs_group.attrs = sysfs_attrs;
> + }
-ck
^ permalink raw reply [flat|nested] 10+ messages in thread
* Re: [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs
2024-07-02 6:04 ` [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs Alistair Francis
2024-07-02 11:57 ` Chaitanya Kulkarni
@ 2024-07-02 13:58 ` Jonathan Cameron
2024-07-05 1:24 ` Alistair Francis
1 sibling, 1 reply; 10+ messages in thread
From: Jonathan Cameron @ 2024-07-02 13:58 UTC (permalink / raw)
To: Alistair Francis
Cc: bhelgaas, linux-pci, lukas, alex.williamson, christian.koenig,
kch, gregkh, logang, linux-kernel, chaitanyak, rdunlap,
Alistair Francis
On Tue, 2 Jul 2024 16:04:17 +1000
Alistair Francis <alistair23@gmail.com> wrote:
> The PCIe 6 specification added support for the Data Object
> Exchange (DOE).
> When DOE is supported the DOE Discovery Feature must be implemented per
> PCIe r6.1 sec 6.30.1.1. The protocol allows a requester to obtain
> information about the other DOE features supported by the device.
>
> The kernel is already querying the DOE features supported and cacheing
> the values. Expose the values in sysfs to allow user space to
> determine which DOE features are supported by the PCIe device.
>
> By exposing the information to userspace tools like lspci can relay the
> information to users. By listing all of the supported features we can
> allow userspace to parse the list, which might include
> vendor specific features as well as yet to be supported features.
>
> After this patch is supported you can see something like this when
> attaching a DOE device
>
> $ ls /sys/devices/pci0000:00/0000:00:02.0//doe*
> 0001:00 0001:01 0001:02
>
> Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
> ---
> v13:
> - Drop pci_doe_sysfs_init() and use pci_doe_sysfs_group
> - As discussed in https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
> we can just modify pci_doe_sysfs_group at the DOE init and let
Can't do that as it is global so you expose the same DOE features for
all DOEs.
Also, I think that this is only processing features on last doe_mb found
for a given device. Fix that and the duplicates problem resurfaces.
> device_add() handle the sysfs attributes.
> diff --git a/drivers/pci/doe.c b/drivers/pci/doe.c
> index defc4be81bd4..e7b702afce88 100644
> --- a/drivers/pci/doe.c
> +++ b/drivers/pci/doe.c
> +
> static int pci_doe_wait(struct pci_doe_mb *doe_mb, unsigned long timeout)
> {
> if (wait_event_timeout(doe_mb->wq,
> @@ -687,6 +747,12 @@ void pci_doe_init(struct pci_dev *pdev)
> {
> struct pci_doe_mb *doe_mb;
> u16 offset = 0;
> + struct attribute **sysfs_attrs;
> + struct device_attribute *attrs;
> + unsigned long num_features = 0;
> + unsigned long i;
> + unsigned long vid, type;
> + void *entry;
> int rc;
>
> xa_init(&pdev->doe_mbs);
> @@ -707,6 +773,45 @@ void pci_doe_init(struct pci_dev *pdev)
> pci_doe_destroy_mb(doe_mb);
> }
> }
The above is looping over multiple DOEs but this just considers last one.
That doesn't look right...
I think this needs to be in the loop and having done that
the duplicate handling may be an issue. I'm not sure what happens
in that path with a presupplied set of attributes.
> +
> + if (doe_mb) {
> + xa_for_each(&doe_mb->feats, i, entry)
> + num_features++;
> +
> + sysfs_attrs = kcalloc(num_features + 1, sizeof(*sysfs_attrs), GFP_KERNEL);
> + if (!sysfs_attrs)
> + return;
> +
> + attrs = kcalloc(num_features, sizeof(*attrs), GFP_KERNEL);
> + if (!attrs) {
> + kfree(sysfs_attrs);
> + return;
> + }
> +
> + doe_mb->device_attrs = attrs;
> + doe_mb->sysfs_attrs = sysfs_attrs;
> +
> + xa_for_each(&doe_mb->feats, i, entry) {
> + sysfs_attr_init(&attrs[i].attr);
> +
> + vid = xa_to_value(entry) >> 8;
> + type = xa_to_value(entry) & 0xFF;
> +
> + attrs[i].attr.name = kasprintf(GFP_KERNEL, "%04lx:%02lx", vid, type);
> + if (!attrs[i].attr.name) {
> + pci_doe_sysfs_feature_remove(pdev, doe_mb);
> + return;
> + }
> + attrs[i].attr.mode = 0444;
> + attrs[i].show = pci_doe_sysfs_feature_show;
> +
> + sysfs_attrs[i] = &attrs[i].attr;
> + }
> +
> + sysfs_attrs[num_features] = NULL;
> +
> + pci_doe_sysfs_group.attrs = sysfs_attrs;
Hmm. Isn't this global? What if you have multiple devices.
> + }
> }
>
^ permalink raw reply [flat|nested] 10+ messages in thread
* Re: [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs
2024-07-02 13:58 ` Jonathan Cameron
@ 2024-07-05 1:24 ` Alistair Francis
2024-07-05 10:29 ` Jonathan Cameron
0 siblings, 1 reply; 10+ messages in thread
From: Alistair Francis @ 2024-07-05 1:24 UTC (permalink / raw)
To: Jonathan Cameron
Cc: bhelgaas, linux-pci, lukas, alex.williamson, christian.koenig,
kch, gregkh, logang, linux-kernel, chaitanyak, rdunlap,
Alistair Francis
On Tue, Jul 2, 2024 at 11:58 PM Jonathan Cameron
<Jonathan.Cameron@huawei.com> wrote:
>
> On Tue, 2 Jul 2024 16:04:17 +1000
> Alistair Francis <alistair23@gmail.com> wrote:
>
> > The PCIe 6 specification added support for the Data Object
> > Exchange (DOE).
> > When DOE is supported the DOE Discovery Feature must be implemented per
> > PCIe r6.1 sec 6.30.1.1. The protocol allows a requester to obtain
> > information about the other DOE features supported by the device.
> >
> > The kernel is already querying the DOE features supported and cacheing
> > the values. Expose the values in sysfs to allow user space to
> > determine which DOE features are supported by the PCIe device.
> >
> > By exposing the information to userspace tools like lspci can relay the
> > information to users. By listing all of the supported features we can
> > allow userspace to parse the list, which might include
> > vendor specific features as well as yet to be supported features.
> >
> > After this patch is supported you can see something like this when
> > attaching a DOE device
> >
> > $ ls /sys/devices/pci0000:00/0000:00:02.0//doe*
> > 0001:00 0001:01 0001:02
> >
> > Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
> > ---
> > v13:
> > - Drop pci_doe_sysfs_init() and use pci_doe_sysfs_group
> > - As discussed in https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
> > we can just modify pci_doe_sysfs_group at the DOE init and let
>
> Can't do that as it is global so you expose the same DOE features for
> all DOEs.
>
> Also, I think that this is only processing features on last doe_mb found
> for a given device. Fix that and the duplicates problem resurfaces.
>
>
> > device_add() handle the sysfs attributes.
>
>
> > diff --git a/drivers/pci/doe.c b/drivers/pci/doe.c
> > index defc4be81bd4..e7b702afce88 100644
> > --- a/drivers/pci/doe.c
> > +++ b/drivers/pci/doe.c
>
> > +
> > static int pci_doe_wait(struct pci_doe_mb *doe_mb, unsigned long timeout)
> > {
> > if (wait_event_timeout(doe_mb->wq,
> > @@ -687,6 +747,12 @@ void pci_doe_init(struct pci_dev *pdev)
> > {
> > struct pci_doe_mb *doe_mb;
> > u16 offset = 0;
> > + struct attribute **sysfs_attrs;
> > + struct device_attribute *attrs;
> > + unsigned long num_features = 0;
> > + unsigned long i;
> > + unsigned long vid, type;
> > + void *entry;
> > int rc;
> >
> > xa_init(&pdev->doe_mbs);
> > @@ -707,6 +773,45 @@ void pci_doe_init(struct pci_dev *pdev)
> > pci_doe_destroy_mb(doe_mb);
> > }
> > }
>
> The above is looping over multiple DOEs but this just considers last one.
> That doesn't look right...
Yeah... That isn't right.
>
> I think this needs to be in the loop and having done that
> the duplicate handing may be an issue. I'm not sure what happens
> in that path with a presupplied set of attributes.
>
> > +
> > + if (doe_mb) {
> > + xa_for_each(&doe_mb->feats, i, entry)
> > + num_features++;
> > +
> > + sysfs_attrs = kcalloc(num_features + 1, sizeof(*sysfs_attrs), GFP_KERNEL);
> > + if (!sysfs_attrs)
> > + return;
> > +
> > + attrs = kcalloc(num_features, sizeof(*attrs), GFP_KERNEL);
> > + if (!attrs) {
> > + kfree(sysfs_attrs);
> > + return;
> > + }
> > +
> > + doe_mb->device_attrs = attrs;
> > + doe_mb->sysfs_attrs = sysfs_attrs;
> > +
> > + xa_for_each(&doe_mb->feats, i, entry) {
> > + sysfs_attr_init(&attrs[i].attr);
> > +
> > + vid = xa_to_value(entry) >> 8;
> > + type = xa_to_value(entry) & 0xFF;
> > +
> > + attrs[i].attr.name = kasprintf(GFP_KERNEL, "%04lx:%02lx", vid, type);
> > + if (!attrs[i].attr.name) {
> > + pci_doe_sysfs_feature_remove(pdev, doe_mb);
> > + return;
> > + }
> > + attrs[i].attr.mode = 0444;
> > + attrs[i].show = pci_doe_sysfs_feature_show;
> > +
> > + sysfs_attrs[i] = &attrs[i].attr;
> > + }
> > +
> > + sysfs_attrs[num_features] = NULL;
> > +
> > + pci_doe_sysfs_group.attrs = sysfs_attrs;
> Hmm. Isn't this global? What if you have multiple devices.
Any input from a PCI maintainer here?
There are basically two approaches.
1. We can have a pci_doe_sysfs_init() function that is called where
we dynamically add the entries, like in v12
2. We can go down the dev->groups and device_add() path, like this
patch and discussed at
https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
For the second we will have to create a global pci_doe_sysfs_group
that contains all possible DOE entries on the system and then have the
show functions determine if they should be displayed for that device.
Every time we call pci_doe_init() we can check for any missing entries
in pci_doe_sysfs_group.attrs and then realloc
pci_doe_sysfs_group.attrs to add them. Untested, but that should work
even for hot-plugged devices. pci_doe_sysfs_group.attrs would just
grow forever though as I don't think we have an easy way to deallocate
anything as we aren't sure if we are the only entry.
Thoughts?
Alistair
^ permalink raw reply [flat|nested] 10+ messages in thread
* Re: [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs
2024-07-05 1:24 ` Alistair Francis
@ 2024-07-05 10:29 ` Jonathan Cameron
2024-07-08 0:55 ` Krzysztof Wilczyński
0 siblings, 1 reply; 10+ messages in thread
From: Jonathan Cameron @ 2024-07-05 10:29 UTC (permalink / raw)
To: Alistair Francis
Cc: bhelgaas, linux-pci, lukas, alex.williamson, christian.koenig,
kch, gregkh, logang, linux-kernel, chaitanyak, rdunlap,
Alistair Francis
On Fri, 5 Jul 2024 11:24:25 +1000
Alistair Francis <alistair23@gmail.com> wrote:
> On Tue, Jul 2, 2024 at 11:58 PM Jonathan Cameron
> <Jonathan.Cameron@huawei.com> wrote:
> >
> > On Tue, 2 Jul 2024 16:04:17 +1000
> > Alistair Francis <alistair23@gmail.com> wrote:
> >
> > > The PCIe 6 specification added support for the Data Object
> > > Exchange (DOE).
> > > When DOE is supported the DOE Discovery Feature must be implemented per
> > > PCIe r6.1 sec 6.30.1.1. The protocol allows a requester to obtain
> > > information about the other DOE features supported by the device.
> > >
> > > The kernel is already querying the DOE features supported and cacheing
> > > the values. Expose the values in sysfs to allow user space to
> > > determine which DOE features are supported by the PCIe device.
> > >
> > > By exposing the information to userspace tools like lspci can relay the
> > > information to users. By listing all of the supported features we can
> > > allow userspace to parse the list, which might include
> > > vendor specific features as well as yet to be supported features.
> > >
> > > After this patch is supported you can see something like this when
> > > attaching a DOE device
> > >
> > > $ ls /sys/devices/pci0000:00/0000:00:02.0//doe*
> > > 0001:00 0001:01 0001:02
> > >
> > > Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
> > > ---
> > > v13:
> > > - Drop pci_doe_sysfs_init() and use pci_doe_sysfs_group
> > > - As discussed in https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
> > > we can just modify pci_doe_sysfs_group at the DOE init and let
> >
> > Can't do that as it is global so you expose the same DOE features for
> > all DOEs.
> >
> > Also, I think that this is only processing features on last doe_mb found
> > for a given device. Fix that and the duplicates problem resurfaces.
> >
> >
> > > device_add() handle the sysfs attributes.
> >
> >
> > > diff --git a/drivers/pci/doe.c b/drivers/pci/doe.c
> > > index defc4be81bd4..e7b702afce88 100644
> > > --- a/drivers/pci/doe.c
> > > +++ b/drivers/pci/doe.c
> >
> > > +
> > > static int pci_doe_wait(struct pci_doe_mb *doe_mb, unsigned long timeout)
> > > {
> > > if (wait_event_timeout(doe_mb->wq,
> > > @@ -687,6 +747,12 @@ void pci_doe_init(struct pci_dev *pdev)
> > > {
> > > struct pci_doe_mb *doe_mb;
> > > u16 offset = 0;
> > > + struct attribute **sysfs_attrs;
> > > + struct device_attribute *attrs;
> > > + unsigned long num_features = 0;
> > > + unsigned long i;
> > > + unsigned long vid, type;
> > > + void *entry;
> > > int rc;
> > >
> > > xa_init(&pdev->doe_mbs);
> > > @@ -707,6 +773,45 @@ void pci_doe_init(struct pci_dev *pdev)
> > > pci_doe_destroy_mb(doe_mb);
> > > }
> > > }
> >
> > The above is looping over multiple DOEs but this just considers last one.
> > That doesn't look right...
>
> Yeah... That isn't
>
> >
> > I think this needs to be in the loop and having done that
> > the duplicate handing may be an issue. I'm not sure what happens
> > in that path with a presupplied set of attributes.
> >
> > > +
> > > + if (doe_mb) {
> > > + xa_for_each(&doe_mb->feats, i, entry)
> > > + num_features++;
> > > +
> > > + sysfs_attrs = kcalloc(num_features + 1, sizeof(*sysfs_attrs), GFP_KERNEL);
> > > + if (!sysfs_attrs)
> > > + return;
> > > +
> > > + attrs = kcalloc(num_features, sizeof(*attrs), GFP_KERNEL);
> > > + if (!attrs) {
> > > + kfree(sysfs_attrs);
> > > + return;
> > > + }
> > > +
> > > + doe_mb->device_attrs = attrs;
> > > + doe_mb->sysfs_attrs = sysfs_attrs;
> > > +
> > > + xa_for_each(&doe_mb->feats, i, entry) {
> > > + sysfs_attr_init(&attrs[i].attr);
> > > +
> > > + vid = xa_to_value(entry) >> 8;
> > > + type = xa_to_value(entry) & 0xFF;
> > > +
> > > + attrs[i].attr.name = kasprintf(GFP_KERNEL, "%04lx:%02lx", vid, type);
> > > + if (!attrs[i].attr.name) {
> > > + pci_doe_sysfs_feature_remove(pdev, doe_mb);
> > > + return;
> > > + }
> > > + attrs[i].attr.mode = 0444;
> > > + attrs[i].show = pci_doe_sysfs_feature_show;
> > > +
> > > + sysfs_attrs[i] = &attrs[i].attr;
> > > + }
> > > +
> > > + sysfs_attrs[num_features] = NULL;
> > > +
> > > + pci_doe_sysfs_group.attrs = sysfs_attrs;
> > Hmm. Isn't this global? What if you have multiple devices.
>
> Any input from a PCI maintainer here?
>
> There are basically two approaches.
>
> 1. We can have a pci_doe_sysfs_init() function that is called where
> we dynamically add the entries, like in v12
> 2. We can go down the dev->groups and device_add() path, like this
> patch and discussed at
> https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
>
> For the second we will have to create a global pci_doe_sysfs_group
> that contains all possible DOE entries on the system and then have the
> show functions determine if they should be displayed for that device.
>
> Everytime we call pci_doe_init() we can check for any missing entries
> in pci_doe_sysfs_group.attrs and then realloc
> pci_doe_sysfs_group.attrs to add them.
> Untested, but that should work
> even for hot-plugged devices. pci_doe_sysfs_group.attrs would just
> grow forever though as I don't think we have an easy way to deallocate
> anything as we aren't sure if we are the only entry.
I think this needs to be per device, not global and you'll have to manually
do the group visibility magic rather than using the macros.
>
> Thoughts?
>
> Alistair
^ permalink raw reply [flat|nested] 10+ messages in thread
* Re: [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs
2024-07-05 10:29 ` Jonathan Cameron
@ 2024-07-08 0:55 ` Krzysztof Wilczyński
2024-07-09 0:50 ` Alistair Francis
0 siblings, 1 reply; 10+ messages in thread
From: Krzysztof Wilczyński @ 2024-07-08 0:55 UTC (permalink / raw)
To: Jonathan Cameron
Cc: Alistair Francis, bhelgaas, linux-pci, lukas, alex.williamson,
christian.koenig, kch, gregkh, logang, linux-kernel, chaitanyak,
rdunlap, Alistair Francis
Hello,
> > Any input from a PCI maintainer here?
Something that I am curious about: can we make this a single file with a
bitmask inside that denotes what DOE features are enabled? Would this
approach even be feasible here?
Thoughts? Or is it too late to think about this now?
> > There are basically two approaches.
> >
> > 1. We can have a pci_doe_sysfs_init() function that is called where
> > we dynamically add the entries, like in v12
> > 2. We can go down the dev->groups and device_add() path, like this
> > patch and discussed at
> > https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
> >
> > For the second we will have to create a global pci_doe_sysfs_group
> > that contains all possible DOE entries on the system and then have the
> > show functions determine if they should be displayed for that device.
> >
> > Everytime we call pci_doe_init() we can check for any missing entries
> > in pci_doe_sysfs_group.attrs and then realloc
> > pci_doe_sysfs_group.attrs to add them.
> > Untested, but that should work
> > even for hot-plugged devices. pci_doe_sysfs_group.attrs would just
> > grow forever though as I don't think we have an easy way to deallocate
> > anything as we aren't sure if we are the only entry.
>
> I think this needs to be per device, not global and you'll have to manually
> do the group visibility magic rather than using the macros.
Lukas recently proposed a very interesting kernfs feature, per:
https://lore.kernel.org/linux-pci/16490618cbde91b5aac04873c39c8fb7666ff686.1719771133.git.lukas@wunner.de
Would this help with DOE features?
Krzysztof
^ permalink raw reply [flat|nested] 10+ messages in thread
* Re: [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs
2024-07-08 0:55 ` Krzysztof Wilczyński
@ 2024-07-09 0:50 ` Alistair Francis
0 siblings, 0 replies; 10+ messages in thread
From: Alistair Francis @ 2024-07-09 0:50 UTC (permalink / raw)
To: Krzysztof Wilczyński
Cc: Jonathan Cameron, bhelgaas, linux-pci, lukas, alex.williamson,
christian.koenig, kch, gregkh, logang, linux-kernel, chaitanyak,
rdunlap, Alistair Francis
On Mon, Jul 8, 2024 at 10:55 AM Krzysztof Wilczyński <kw@linux.com> wrote:
>
> Hello,
>
> > > Any input from a PCI maintainer here?
>
> Something that I am curious about: can we make this a single file with a
> bitmask inside that denotes what DOE features are enabled? Would this be
> approach be even feasible here?
In theory there can be any vendor ID (16 bits, but not 0xFFFF) and any
feature (8 bits). So there is a huge range of possible values here.
>
> Thoughts? Or is it too late to think about this now?
There are just too many possible options to use a single bitmask. I guess
we could use a feature bitmask per vendor if people feel strongly.
>
> > > There are basically two approaches.
> > >
> > > 1. We can have a pci_doe_sysfs_init() function that is called where
> > > we dynamically add the entries, like in v12
> > > 2. We can go down the dev->groups and device_add() path, like this
> > > patch and discussed at
> > > https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
> > >
> > > For the second we will have to create a global pci_doe_sysfs_group
> > > that contains all possible DOE entries on the system and then have the
> > > show functions determine if they should be displayed for that device.
> > >
> > > Everytime we call pci_doe_init() we can check for any missing entries
> > > in pci_doe_sysfs_group.attrs and then realloc
> > > pci_doe_sysfs_group.attrs to add them.
> > > Untested, but that should work
> > > even for hot-plugged devices. pci_doe_sysfs_group.attrs would just
> > > grow forever though as I don't think we have an easy way to deallocate
> > > anything as we aren't sure if we are the only entry.
> >
> > I think this needs to be per device, not global and you'll have to manually
> > do the group visibility magic rather than using the macros.
>
> Lukas proposes a very interesting feature of kernfs recently per:
>
> https://lore.kernel.org/linux-pci/16490618cbde91b5aac04873c39c8fb7666ff686.1719771133.git.lukas@wunner.de
>
> Would this help with DOE features?
That was the previous approach used here:
https://lore.kernel.org/linux-pci/20240626045926.680380-3-alistair.francis@wdc.com/
Bjorn wanted to try and avoid using a function pci_doe_sysfs_init()
[1], which is what I tried here. It sounds like the v12 approach is
the way to go then. I'll send a v14 based on v12 with the comments
addressed.
1: https://lore.kernel.org/all/20231019165829.GA1381099@bhelgaas/
Alistair
>
> Krzysztof
^ permalink raw reply [flat|nested] 10+ messages in thread
end of thread, other threads:[~2024-07-09 0:50 UTC | newest]
Thread overview: 10+ messages (download: mbox.gz follow: Atom feed
-- links below jump to the message on this page --
2024-07-02 6:04 [PATCH v13 1/4] PCI/DOE: Rename DOE protocol to feature Alistair Francis
2024-07-02 6:04 ` [PATCH v13 2/4] PCI/DOE: Rename Discovery Response Data Object Contents to type Alistair Francis
2024-07-02 6:04 ` [PATCH v13 3/4] PCI/DOE: Expose the DOE features via sysfs Alistair Francis
2024-07-02 11:57 ` Chaitanya Kulkarni
2024-07-02 13:58 ` Jonathan Cameron
2024-07-05 1:24 ` Alistair Francis
2024-07-05 10:29 ` Jonathan Cameron
2024-07-08 0:55 ` Krzysztof Wilczyński
2024-07-09 0:50 ` Alistair Francis
2024-07-02 6:04 ` [PATCH v13 4/4] PCI/DOE: Allow enabling DOE without CXL Alistair Francis
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox