From: Yonatan Nachum <ynachum@amazon.com>
To: <jgg@nvidia.com>, <leon@kernel.org>, <linux-rdma@vger.kernel.org>
Cc: <mrgolin@amazon.com>, <sleybo@amazon.com>, <matua@amazon.com>,
<gal.pressman@linux.dev>, Yonatan Nachum <ynachum@amazon.com>,
Firas Jahjah <firasj@amazon.com>
Subject: [PATCH for-next v5 2/2] RDMA/efa: Add AH cache handling on create and destroy AH
Date: Sun, 28 Jun 2026 13:34:22 +0000 [thread overview]
Message-ID: <20260628133422.523230-3-ynachum@amazon.com> (raw)
In-Reply-To: <20260628133422.523230-1-ynachum@amazon.com>
On create AH, first check if the AH cache entry already exists and if
so, returns the already stored AH number. If the entry doesn't exist,
the driver creates it and calls the device to create the AH. A per-entry
mutex serializes concurrent device commands on the same AH cache entry,
ensuring only one thread issues the device create while others wait and
reuse the result. If the device create fails, the entry's user count
remains zero so subsequent threads will retry the device create.
On destroy AH, the user count is decremented under the entry mutex. If
it reaches zero, the driver issues the device destroy command. After
the device destroy completes, it removes the entry from the hashtable
and frees it if no other references exist. If new users arrived during
the destroy, the entry remains in the hashtable for reuse.
Reviewed-by: Firas Jahjah <firasj@amazon.com>
Reviewed-by: Michael Margolin <mrgolin@amazon.com>
Signed-off-by: Yonatan Nachum <ynachum@amazon.com>
---
drivers/infiniband/hw/efa/efa_ah_cache.c | 94 ++++++++++++++++++++++++
drivers/infiniband/hw/efa/efa_ah_cache.h | 3 +
drivers/infiniband/hw/efa/efa_com_cmd.c | 41 ++++++++++-
drivers/infiniband/hw/efa/efa_com_cmd.h | 1 +
drivers/infiniband/hw/efa/efa_verbs.c | 9 ++-
5 files changed, 140 insertions(+), 8 deletions(-)
diff --git a/drivers/infiniband/hw/efa/efa_ah_cache.c b/drivers/infiniband/hw/efa/efa_ah_cache.c
index 73e810678767..ede967c063b2 100644
--- a/drivers/infiniband/hw/efa/efa_ah_cache.c
+++ b/drivers/infiniband/hw/efa/efa_ah_cache.c
@@ -40,3 +40,97 @@ void efa_ah_cache_destroy(struct efa_ah_cache *ah_cache)
rhashtable_free_and_destroy(&ah_cache->hashtable, efa_ah_cache_entry_free, NULL);
mutex_destroy(&ah_cache->lock);
}
+
+static struct efa_ah_cache_entry *efa_ah_cache_lookup_locked(struct efa_ah_cache *ah_cache, u16 pd,
+ u8 *gid)
+ __must_hold(&ah_cache->lock)
+{
+ struct efa_ah_cache_key key = {};
+
+ memcpy(key.gid, gid, sizeof(key.gid));
+ key.pd = pd;
+
+ return rhashtable_lookup_fast(&ah_cache->hashtable, &key, ah_cache_params);
+}
+
+struct efa_ah_cache_entry *efa_ah_cache_lookup(struct efa_ah_cache *ah_cache, u16 pd, u8 *gid)
+{
+ struct efa_ah_cache_entry *entry;
+
+ mutex_lock(&ah_cache->lock);
+ entry = efa_ah_cache_lookup_locked(ah_cache, pd, gid);
+ mutex_unlock(&ah_cache->lock);
+
+ return entry;
+}
+
+/**
+ * efa_ah_cache_get - Get or create an AH cache entry
+ * @ah_cache: AH cache
+ * @pd: Protection domain number
+ * @gid: GID address
+ *
+ * Look up an AH cache entry by PD and GID. If found, take a reference and
+ * return it. If not found, allocate a new entry and insert it. The caller must lock
+ * the entry mutex and check usecnt to determine whether a device create
+ * command is needed.
+ *
+ * Return: Pointer to the entry on success, ERR_PTR on failure.
+ */
+struct efa_ah_cache_entry *efa_ah_cache_get(struct efa_ah_cache *ah_cache, u16 pd, u8 *gid)
+{
+ struct efa_ah_cache_entry *entry;
+ int err;
+
+ mutex_lock(&ah_cache->lock);
+
+ entry = efa_ah_cache_lookup_locked(ah_cache, pd, gid);
+ if (entry) {
+ refcount_inc(&entry->refcount);
+ mutex_unlock(&ah_cache->lock);
+ return entry;
+ }
+
+ entry = kzalloc(sizeof(*entry), GFP_KERNEL);
+ if (!entry) {
+ mutex_unlock(&ah_cache->lock);
+ return ERR_PTR(-ENOMEM);
+ }
+
+ memcpy(entry->key.gid, gid, sizeof(entry->key.gid));
+ entry->key.pd = pd;
+ refcount_set(&entry->refcount, 1);
+ mutex_init(&entry->lock);
+
+ err = rhashtable_insert_fast(&ah_cache->hashtable, &entry->linkage, ah_cache_params);
+ if (err) {
+ mutex_destroy(&entry->lock);
+ kfree(entry);
+ mutex_unlock(&ah_cache->lock);
+ return ERR_PTR(err);
+ }
+
+ mutex_unlock(&ah_cache->lock);
+ return entry;
+}
+
+/**
+ * efa_ah_cache_put - Put a refcount of an AH cache entry
+ * @ah_cache: AH cache
+ * @entry: AH cache entry
+ *
+ * Drop the refcount. If it reaches zero, remove the entry from the hashtable
+ * and free it.
+ */
+void efa_ah_cache_put(struct efa_ah_cache *ah_cache, struct efa_ah_cache_entry *entry)
+{
+ if (!refcount_dec_and_mutex_lock(&entry->refcount, &ah_cache->lock))
+ return;
+
+ /* AH cache lock is held here */
+ rhashtable_remove_fast(&ah_cache->hashtable, &entry->linkage, ah_cache_params);
+ mutex_unlock(&ah_cache->lock);
+
+ mutex_destroy(&entry->lock);
+ kfree_rcu(entry, rcu_head);
+}
diff --git a/drivers/infiniband/hw/efa/efa_ah_cache.h b/drivers/infiniband/hw/efa/efa_ah_cache.h
index 42ba17a482c3..4315bba1f880 100644
--- a/drivers/infiniband/hw/efa/efa_ah_cache.h
+++ b/drivers/infiniband/hw/efa/efa_ah_cache.h
@@ -33,5 +33,8 @@ struct efa_ah_cache {
int efa_ah_cache_init(struct efa_ah_cache *ah_cache);
void efa_ah_cache_destroy(struct efa_ah_cache *ah_cache);
+struct efa_ah_cache_entry *efa_ah_cache_get(struct efa_ah_cache *ah_cache, u16 pd, u8 *gid);
+struct efa_ah_cache_entry *efa_ah_cache_lookup(struct efa_ah_cache *ah_cache, u16 pd, u8 *gid);
+void efa_ah_cache_put(struct efa_ah_cache *ah_cache, struct efa_ah_cache_entry *entry);
#endif /* _EFA_AH_CACHE_H_ */
diff --git a/drivers/infiniband/hw/efa/efa_com_cmd.c b/drivers/infiniband/hw/efa/efa_com_cmd.c
index 5db4f5805b59..0b96862c2787 100644
--- a/drivers/infiniband/hw/efa/efa_com_cmd.c
+++ b/drivers/infiniband/hw/efa/efa_com_cmd.c
@@ -322,8 +322,21 @@ int efa_com_create_ah(struct efa_com_dev *edev,
struct efa_admin_create_ah_resp cmd_completion;
struct efa_com_admin_queue *aq = &edev->aq;
struct efa_admin_create_ah_cmd ah_cmd = {};
+ struct efa_ah_cache_entry *entry;
int err;
+ entry = efa_ah_cache_get(&edev->ah_cache, params->pdn, params->dest_addr);
+ if (IS_ERR(entry))
+ return PTR_ERR(entry);
+
+ mutex_lock(&entry->lock);
+ if (entry->usecnt) {
+ result->ah = entry->ah;
+ entry->usecnt++;
+ mutex_unlock(&entry->lock);
+ return 0;
+ }
+
ah_cmd.aq_common_desc.opcode = EFA_ADMIN_CREATE_AH;
memcpy(ah_cmd.dest_addr, params->dest_addr, sizeof(ah_cmd.dest_addr));
@@ -335,13 +348,18 @@ int efa_com_create_ah(struct efa_com_dev *edev,
(struct efa_admin_acq_entry *)&cmd_completion,
sizeof(cmd_completion));
if (err) {
+ mutex_unlock(&entry->lock);
+ efa_ah_cache_put(&edev->ah_cache, entry);
ibdev_err_ratelimited(edev->efa_dev,
"Failed to create ah for %pI6 [%d]\n",
ah_cmd.dest_addr, err);
return err;
}
+ entry->ah = cmd_completion.ah;
result->ah = cmd_completion.ah;
+ entry->usecnt++;
+ mutex_unlock(&entry->lock);
return 0;
}
@@ -352,11 +370,20 @@ int efa_com_destroy_ah(struct efa_com_dev *edev,
struct efa_admin_destroy_ah_resp cmd_completion;
struct efa_admin_destroy_ah_cmd ah_cmd = {};
struct efa_com_admin_queue *aq = &edev->aq;
- int err;
+ struct efa_ah_cache_entry *entry;
+ int err = 0;
+
+ entry = efa_ah_cache_lookup(&edev->ah_cache, params->pdn, params->gid);
+ if (!entry)
+ return -EINVAL;
+
+ mutex_lock(&entry->lock);
+ if (entry->usecnt > 1)
+ goto out_put;
ah_cmd.aq_common_desc.opcode = EFA_ADMIN_DESTROY_AH;
- ah_cmd.ah = params->ah;
- ah_cmd.pd = params->pdn;
+ ah_cmd.ah = entry->ah;
+ ah_cmd.pd = entry->key.pd;
err = efa_com_cmd_exec(aq,
(struct efa_admin_aq_entry *)&ah_cmd,
@@ -364,13 +391,19 @@ int efa_com_destroy_ah(struct efa_com_dev *edev,
(struct efa_admin_acq_entry *)&cmd_completion,
sizeof(cmd_completion));
if (err) {
+ mutex_unlock(&entry->lock);
ibdev_err_ratelimited(edev->efa_dev,
"Failed to destroy ah-%d pd-%d [%d]\n",
ah_cmd.ah, ah_cmd.pd, err);
return err;
}
- return 0;
+out_put:
+ entry->usecnt--;
+ mutex_unlock(&entry->lock);
+ efa_ah_cache_put(&edev->ah_cache, entry);
+
+ return err;
}
bool
diff --git a/drivers/infiniband/hw/efa/efa_com_cmd.h b/drivers/infiniband/hw/efa/efa_com_cmd.h
index ef15b3c38429..39bd4e06684a 100644
--- a/drivers/infiniband/hw/efa/efa_com_cmd.h
+++ b/drivers/infiniband/hw/efa/efa_com_cmd.h
@@ -106,6 +106,7 @@ struct efa_com_create_ah_result {
struct efa_com_destroy_ah_params {
u16 ah;
+ u8 gid[EFA_GID_SIZE];
u16 pdn;
};
diff --git a/drivers/infiniband/hw/efa/efa_verbs.c b/drivers/infiniband/hw/efa/efa_verbs.c
index 5bb00cb85775..eb10aeedd31b 100644
--- a/drivers/infiniband/hw/efa/efa_verbs.c
+++ b/drivers/infiniband/hw/efa/efa_verbs.c
@@ -2045,10 +2045,11 @@ int efa_mmap(struct ib_ucontext *ibucontext,
static int efa_ah_destroy(struct efa_dev *dev, struct efa_ah *ah)
{
- struct efa_com_destroy_ah_params params = {
- .ah = ah->ah,
- .pdn = to_epd(ah->ibah.pd)->pdn,
- };
+ struct efa_com_destroy_ah_params params = {};
+
+ params.ah = ah->ah;
+ memcpy(params.gid, ah->id, sizeof(params.gid));
+ params.pdn = to_epd(ah->ibah.pd)->pdn;
return efa_com_destroy_ah(&dev->edev, ¶ms);
}
--
2.50.1
prev parent reply other threads:[~2026-06-28 13:34 UTC|newest]
Thread overview: 3+ messages / expand[flat|nested] mbox.gz Atom feed top
2026-06-28 13:34 [PATCH for-next v5 0/2] RDMA/efa: Add AH cache for AH reuse Yonatan Nachum
2026-06-28 13:34 ` [PATCH for-next v5 1/2] RDMA/efa: Add initialization of AH cache rhashtable Yonatan Nachum
2026-06-28 13:34 ` Yonatan Nachum [this message]
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20260628133422.523230-3-ynachum@amazon.com \
--to=ynachum@amazon.com \
--cc=firasj@amazon.com \
--cc=gal.pressman@linux.dev \
--cc=jgg@nvidia.com \
--cc=leon@kernel.org \
--cc=linux-rdma@vger.kernel.org \
--cc=matua@amazon.com \
--cc=mrgolin@amazon.com \
--cc=sleybo@amazon.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox