Re: [PATCH net-next v28 4/8] eea: create/destroy rx,tx queues for netdevice open and stop

public inbox for netdev@vger.kernel.org
 help / color / mirror / Atom feed

From: Xuan Zhuo <xuanzhuo@linux.alibaba.com>
To: Paolo Abeni <pabeni@redhat.com>
Cc: Andrew Lunn <andrew+netdev@lunn.ch>,
	"David S. Miller" <davem@davemloft.net>,
	Eric Dumazet <edumazet@google.com>,
	Jakub Kicinski <kuba@kernel.org>,
	Wen Gu <guwen@linux.alibaba.com>,
	Philo Lu <lulie@linux.alibaba.com>,
	Lorenzo Bianconi <lorenzo@kernel.org>,
	Vadim Fedorenko <vadim.fedorenko@linux.dev>,
	Dong Yibo <dong100@mucse.com>,
	Heiner Kallweit <hkallweit1@gmail.com>,
	Lukas Bulwahn <lukas.bulwahn@redhat.com>,
	Dust Li <dust.li@linux.alibaba.com>,
	netdev@vger.kernel.org
Subject: Re: [PATCH net-next v28 4/8] eea: create/destroy rx,tx queues for netdevice open and stop
Date: Mon, 9 Mar 2026 16:51:08 +0800	[thread overview]
Message-ID: <1773046268.140821-1-xuanzhuo@linux.alibaba.com> (raw)
In-Reply-To: <e6c3b053-75d7-46b5-9fd0-ac6de498456f@redhat.com>

On Thu, 5 Mar 2026 11:16:32 +0100, Paolo Abeni <pabeni@redhat.com> wrote:
> On 3/2/26 3:46 AM, Xuan Zhuo wrote:
> > Add basic driver framework for the Alibaba Elastic Ethernet Adapter(EEA).
> >
> > This commit introduces the implementation for the netdevice open and
> > stop.
> >
> > Reviewed-by: Dust Li <dust.li@linux.alibaba.com>
> > Reviewed-by: Philo Lu <lulie@linux.alibaba.com>
> > Signed-off-by: Wen Gu <guwen@linux.alibaba.com>
> > Signed-off-by: Xuan Zhuo <xuanzhuo@linux.alibaba.com>
> > ---
> >  drivers/net/ethernet/alibaba/eea/Makefile  |   4 +-
> >  drivers/net/ethernet/alibaba/eea/eea_net.c | 530 ++++++++++++++++++++-
> >  drivers/net/ethernet/alibaba/eea/eea_net.h |  45 ++
> >  drivers/net/ethernet/alibaba/eea/eea_pci.c | 182 ++++++-
> >  drivers/net/ethernet/alibaba/eea/eea_pci.h |  13 +
> >  drivers/net/ethernet/alibaba/eea/eea_rx.c  | 254 ++++++++++
> >  drivers/net/ethernet/alibaba/eea/eea_tx.c  | 104 ++++
> >  7 files changed, 1127 insertions(+), 5 deletions(-)
> >  create mode 100644 drivers/net/ethernet/alibaba/eea/eea_rx.c
> >  create mode 100644 drivers/net/ethernet/alibaba/eea/eea_tx.c
> >
> > diff --git a/drivers/net/ethernet/alibaba/eea/Makefile b/drivers/net/ethernet/alibaba/eea/Makefile
> > index 91f318e8e046..fa34a005fa01 100644
> > --- a/drivers/net/ethernet/alibaba/eea/Makefile
> > +++ b/drivers/net/ethernet/alibaba/eea/Makefile
> > @@ -3,4 +3,6 @@ obj-$(CONFIG_EEA) += eea.o
> >  eea-y := eea_ring.o \
> >  	eea_net.o \
> >  	eea_pci.o \
> > -	eea_adminq.o
> > +	eea_adminq.o \
> > +	eea_tx.o \
> > +	eea_rx.o
> > diff --git a/drivers/net/ethernet/alibaba/eea/eea_net.c b/drivers/net/ethernet/alibaba/eea/eea_net.c
> > index 31cb9ca5b408..2ebf0053d05e 100644
> > --- a/drivers/net/ethernet/alibaba/eea/eea_net.c
> > +++ b/drivers/net/ethernet/alibaba/eea/eea_net.c
> > @@ -18,6 +18,453 @@
> >
> >  #define EEA_SPLIT_HDR_SIZE 128
> >
> > +static irqreturn_t eea_irq_handler(int irq, void *data)
> > +{
> > +	struct eea_irq_blk *blk = data;
> > +
> > +	napi_schedule_irqoff(&blk->napi);
> > +
> > +	return IRQ_HANDLED;
> > +}
> > +
> > +static void eea_free_irq_blk(struct eea_net *enet)
> > +{
> > +	struct eea_irq_blk *blk;
> > +	u32 num;
> > +	int i;
> > +
> > +	if (!enet->irq_blks)
> > +		return;
> > +
> > +	num = enet->edev->rx_num;
> > +
> > +	for (i = 0; i < num; i++) {
> > +		blk = &enet->irq_blks[i];
> > +
> > +		if (blk->ready)
> > +			eea_pci_free_irq(blk);
> > +
> > +		blk->ready = false;
> > +	}
> > +
> > +	kvfree(enet->irq_blks);
> > +	enet->irq_blks = NULL;
> > +}
> > +
> > +static int eea_alloc_irq_blks(struct eea_net *enet, u32 num)
> > +{
> > +	struct eea_device *edev = enet->edev;
> > +	struct eea_irq_blk *blk, *irq_blks;
> > +	int i, err;
> > +
> > +	irq_blks = kvcalloc(num, sizeof(*blk), GFP_KERNEL);
> > +	if (!irq_blks)
> > +		return -ENOMEM;
> > +
> > +	enet->irq_blks = irq_blks;
> > +
> > +	for (i = 0; i < num; i++) {
> > +		blk = &irq_blks[i];
> > +		blk->idx = i;
> > +
> > +		/* vec 0 is for error notify. */
> > +		blk->msix_vec = i + 1;
> > +
> > +		err = eea_pci_request_irq(edev, blk, eea_irq_handler);
> > +		if (err)
> > +			goto err_free_irq_blk;
> > +
> > +		blk->ready = true;
> > +	}
> > +
> > +	return 0;
> > +
> > +err_free_irq_blk:
> > +	eea_free_irq_blk(enet);
> > +	return err;
> > +}
> > +
> > +static int eea_update_queues(struct eea_net *enet)
> > +{
> > +	return netif_set_real_num_queues(enet->netdev, enet->cfg.tx_ring_num,
> > +					 enet->cfg.rx_ring_num);
> > +}
> > +
> > +void eea_init_ctx(struct eea_net *enet, struct eea_net_init_ctx *ctx)
> > +{
> > +	memset(ctx, 0, sizeof(*ctx));
> > +
> > +	ctx->netdev = enet->netdev;
> > +	ctx->edev = enet->edev;
> > +	ctx->cfg = enet->cfg;
> > +}
> > +
> > +static void eea_bind_q_and_cfg(struct eea_net *enet,
> > +			       struct eea_net_init_ctx *ctx)
> > +{
> > +	struct eea_irq_blk *blk;
> > +	struct eea_net_rx *rx;
> > +	struct eea_net_tx *tx;
> > +	int i;
> > +
> > +	enet->cfg = ctx->cfg;
> > +	enet->rx = ctx->rx;
> > +	enet->tx = ctx->tx;
> > +
> > +	for (i = 0; i < ctx->cfg.rx_ring_num; i++) {
> > +		blk = &enet->irq_blks[i];
> > +
> > +		rx = ctx->rx[i];
> > +		tx = &ctx->tx[i];
> > +
> > +		rx->enet = enet;
> > +		rx->napi = &blk->napi;
> > +		rx->ering->msix_vec = blk->msix_vec;
> > +
> > +		tx->enet = enet;
> > +		tx->ering->msix_vec = blk->msix_vec;
> > +
> > +		blk->rx = rx;
> > +	}
> > +}
> > +
> > +static void eea_unbind_q_and_cfg(struct eea_net *enet,
> > +				 struct eea_net_init_ctx *ctx)
> > +{
> > +	struct eea_irq_blk *blk;
> > +	struct eea_net_rx *rx;
> > +	int i;
> > +
> > +	ctx->cfg = enet->cfg;
> > +	ctx->rx = enet->rx;
> > +	ctx->tx = enet->tx;
> > +
> > +	enet->rx = NULL;
> > +	enet->tx = NULL;
> > +
> > +	for (i = 0; i < ctx->cfg.rx_ring_num; i++) {
> > +		blk = &enet->irq_blks[i];
> > +
> > +		rx = ctx->rx[i];
> > +
> > +		rx->napi = NULL;
> > +
> > +		blk->rx = NULL;
> > +	}
> > +}
> > +
> > +static void eea_free_rxtx_q_mem(struct eea_net_init_ctx *ctx)
> > +{
> > +	struct eea_net_rx *rx;
> > +	struct eea_net_tx *tx;
> > +	int i;
> > +
> > +	for (i = 0; i < ctx->cfg.rx_ring_num; i++) {
> > +		rx = ctx->rx[i];
> > +		tx = &ctx->tx[i];
> > +
> > +		eea_free_rx(rx, &ctx->cfg);
> > +		eea_free_tx(tx, &ctx->cfg);
> > +	}
> > +
> > +	kvfree(ctx->rx);
> > +	kvfree(ctx->tx);
> > +}
> > +
> > +/* alloc tx/rx: struct, ring, meta, pp, napi */
> > +static int eea_alloc_rxtx_q_mem(struct eea_net_init_ctx *ctx)
> > +{
> > +	struct eea_net_rx *rx;
> > +	struct eea_net_tx *tx;
> > +	int err, i;
> > +
> > +	ctx->tx = kvcalloc(ctx->cfg.tx_ring_num, sizeof(*ctx->tx), GFP_KERNEL);
> > +	if (!ctx->tx)
> > +		return -ENOMEM;
> > +
> > +	ctx->rx = kvcalloc(ctx->cfg.rx_ring_num, sizeof(*ctx->rx), GFP_KERNEL);
> > +	if (!ctx->rx)
> > +		goto err_free_tx;
> > +
> > +	ctx->cfg.rx_sq_desc_size = sizeof(struct eea_rx_desc);
> > +	ctx->cfg.rx_cq_desc_size = sizeof(struct eea_rx_cdesc);
> > +	ctx->cfg.tx_sq_desc_size = sizeof(struct eea_tx_desc);
> > +	ctx->cfg.tx_cq_desc_size = sizeof(struct eea_tx_cdesc);
> > +
> > +	ctx->cfg.tx_cq_desc_size /= 2;
> > +
> > +	if (!ctx->cfg.split_hdr)
> > +		ctx->cfg.rx_sq_desc_size /= 2;
> > +
> > +	for (i = 0; i < ctx->cfg.rx_ring_num; i++) {
> > +		rx = eea_alloc_rx(ctx, i);
> > +		if (!rx)
> > +			goto err_free;
> > +
> > +		ctx->rx[i] = rx;
> > +
> > +		tx = ctx->tx + i;
> > +		err = eea_alloc_tx(ctx, tx, i);
> > +		if (err)
> > +			goto err_free;
> > +	}
> > +
> > +	return 0;
> > +
> > +err_free:
> > +	for (i = 0; i < ctx->cfg.rx_ring_num; i++) {
> > +		rx = ctx->rx[i];
> > +		tx = ctx->tx + i;
> > +
> > +		eea_free_rx(rx, &ctx->cfg);
> > +		eea_free_tx(tx, &ctx->cfg);
> > +	}
> > +
> > +	kvfree(ctx->rx);
> > +
> > +err_free_tx:
> > +	kvfree(ctx->tx);
> > +	return -ENOMEM;
> > +}
> > +
> > +static int eea_hw_active_ring(struct eea_net *enet)
> > +{
> > +	return eea_adminq_create_q(enet, /* qidx = */ 0,
> > +				   enet->cfg.rx_ring_num +
> > +				   enet->cfg.tx_ring_num, 0);
> > +}
> > +
> > +static int eea_hw_unactive_ring(struct eea_net *enet)
> > +{
> > +	int err;
> > +
> > +	err = eea_adminq_destroy_all_q(enet);
> > +	if (err)
> > +		netdev_warn(enet->netdev, "unactive rxtx ring failed.\n");
> > +
> > +	return err;
> > +}
> > +
> > +/* stop rx napi, stop tx queue. */
> > +static void eea_stop_rxtx(struct net_device *netdev)
> > +{
> > +	struct eea_net *enet = netdev_priv(netdev);
> > +	int i;
> > +
> > +	netif_tx_disable(netdev);
> > +
> > +	for (i = 0; i < enet->cfg.rx_ring_num; i++)
> > +		enet_rx_stop(enet->rx[i]);
> > +
> > +	netif_carrier_off(netdev);
> > +}
> > +
> > +static void eea_start_rxtx(struct eea_net *enet)
> > +{
> > +	int i;
> > +
> > +	for (i = 0; i < enet->cfg.rx_ring_num; i++)
> > +		enet_rx_start(enet->rx[i]);
> > +
> > +	netif_tx_start_all_queues(enet->netdev);
> > +	netif_carrier_on(enet->netdev);
> > +
> > +	enet->started = true;
> > +}
> > +
> > +static int eea_netdev_stop(struct net_device *netdev)
> > +{
> > +	struct eea_net *enet = netdev_priv(netdev);
> > +	struct eea_net_init_ctx ctx;
> > +
> > +	/* This function can be called during device anomaly recovery. To
> > +	 * prevent duplicate stop operations, the `started` flag is introduced
> > +	 * for checking.
> > +	 */
> > +
> > +	if (!enet->started) {
> > +		netdev_warn(netdev, "eea netdev stop: but dev is not started.\n");
> > +		return 0;
> > +	}
> > +
> > +	eea_stop_rxtx(netdev);
> > +	eea_hw_unactive_ring(enet);
> > +	eea_unbind_q_and_cfg(enet, &ctx);
> > +	eea_free_rxtx_q_mem(&ctx);
> > +
> > +	enet->started = false;
> > +
> > +	return 0;
> > +}
> > +
> > +static int eea_netdev_open(struct net_device *netdev)
> > +{
> > +	struct eea_net *enet = netdev_priv(netdev);
> > +	struct eea_net_init_ctx ctx;
> > +	int err;
> > +
> > +	if (enet->link_err) {
> > +		netdev_err(netdev, "netdev open err, because link error: %d\n",
> > +			   enet->link_err);
> > +		return -EBUSY;
> > +	}
> > +
> > +	eea_init_ctx(enet, &ctx);
> > +
> > +	err = eea_alloc_rxtx_q_mem(&ctx);
> > +	if (err)
> > +		goto err_done;
> > +
> > +	eea_bind_q_and_cfg(enet, &ctx);
> > +
> > +	err = eea_update_queues(enet);
> > +	if (err)
> > +		goto err_free_q;
> > +
> > +	err = eea_hw_active_ring(enet);
> > +	if (err)
> > +		goto err_free_q;
> > +
> > +	eea_start_rxtx(enet);
> > +
> > +	return 0;
> > +
> > +err_free_q:
> > +	eea_unbind_q_and_cfg(enet, &ctx);
> > +	eea_free_rxtx_q_mem(&ctx);
> > +
> > +err_done:
> > +	return err;
> > +}
> > +
> > +/* resources: ring, buffers, irq */
> > +int eea_reset_hw_resources(struct eea_net *enet, struct eea_net_init_ctx *ctx)
> > +{
> > +	struct eea_net_init_ctx ctx_old = {0};
> > +	int err, error;
> > +
> > +	if (!netif_running(enet->netdev) || !enet->started) {
> > +		enet->cfg = ctx->cfg;
> > +		return 0;
> > +	}
> > +
> > +	err = eea_alloc_rxtx_q_mem(ctx);
> > +	if (err) {
> > +		netdev_warn(enet->netdev,
> > +			    "eea reset: alloc q failed. stop reset. err %d\n",
> > +			    err);
> > +		return err;
> > +	}
> > +
> > +	eea_stop_rxtx(enet->netdev);
> > +	eea_hw_unactive_ring(enet);
> > +
> > +	eea_unbind_q_and_cfg(enet, &ctx_old);
> > +	eea_bind_q_and_cfg(enet, ctx);
> > +
> > +	err = eea_update_queues(enet);
> > +	if (err) {
> > +		netdev_err(enet->netdev,
> > +			   "eea reset: set real num queues failed. err %d\n",
> > +			   err);
> > +		goto err_bind_old;
> > +	}
> > +
> > +	err = eea_hw_active_ring(enet);
>
> AFAICS the need for admins queue destroy and recreation on cfg change is
> what prevents a safe configuration swap (together with irq allocation,
> see below). Could you instead keep the admin queue always alive i.e.
> with maximum number of erings configured, and just enable/them as needded?
>
> If not, please document explicitly the constraint in the commit message.

Generally, during I/O queue reconstruction, the admin queue is not rebuilt.
However, in HA scenarios—which represent a special case—
the DPU notifies the driver to request re-initialization. In this specific
situation, the admin queue will also be rebuilt.

>
> [...]
> > @@ -140,14 +591,65 @@ static struct eea_net *eea_netdev_alloc(struct eea_device *edev, u32 pairs)
> >  	enet->edev = edev;
> >  	edev->enet = enet;
> >
> > +	err = eea_alloc_irq_blks(enet, pairs);
> > +	if (err) {
>
> I'm likely lost, but AFAICS eea_alloc_irq_blks() is invoked only here,
> and allocates edev->rx_num interrupts. rx_num is the number of RX
> channel at device probe time.
>
> set_channels can later change such value, i.e. increasing it. But I
> don't see other irqs allocated.


No, set_channels just change enet.cfg.rx_num, edev->rx_num is readonly.

Thanks.

>
> Also the irq handler takes a direct pointer to the napi struct, as
> opposed to Jakub's suggestion of using a ptr to a p
>
> > +		dev_err(edev->dma_dev,
> > +			"eea_alloc_irq_blks failed with pairs %d\n", pairs);
> > +		free_netdev(netdev);
> > +		return NULL;
> > +	}
> > +
> >  	return enet;
> >  }
> >
> > +static void eea_update_ts_off(struct eea_device *edev, struct eea_net *enet)
> > +{
> > +	u64 ts;
> > +
> > +	ts = eea_pci_device_ts(edev);
> > +
> > +	enet->hw_ts_offset = ktime_get_real() - ts;
> > +}
> > +
> > +static int eea_net_reprobe(struct eea_device *edev)
> > +{
> > +	struct eea_net *enet = edev->enet;
> > +	int err = 0;
> > +
> > +	enet->edev = edev;
> > +
> > +	if (!enet->adminq.ring) {
> > +		err = eea_create_adminq(enet, edev->rx_num + edev->tx_num);
> > +		if (err)
> > +			return err;
> > +	}
> > +
> > +	err = eea_alloc_irq_blks(enet, edev->rx_num);
> > +	if (err) {
> > +		eea_destroy_adminq(enet);
> > +		return -ENOMEM;
> > +	}
> > +
> > +	eea_update_ts_off(edev, enet);
> > +
> > +	if (edev->ha_reset_netdev_running) {
> > +		rtnl_lock();
> > +		enet->link_err = 0;
> > +		err = eea_netdev_open(enet->netdev);
> > +		rtnl_unlock();
> > +	}
> > +
> > +	return err;
> > +}
> > +
> >  int eea_net_probe(struct eea_device *edev)
> >  {
> >  	struct eea_net *enet;
> >  	int err = -ENOMEM;
> >
> > +	if (edev->ha_reset)
> > +		return eea_net_reprobe(edev);
> > +
> >  	enet = eea_netdev_alloc(edev, edev->rx_num);
> >  	if (!enet)
> >  		return -ENOMEM;
> > @@ -168,6 +670,7 @@ int eea_net_probe(struct eea_device *edev)
> >  	if (err)
> >  		goto err_reset_dev;
> >
> > +	eea_update_ts_off(edev, enet);
> >  	netif_carrier_off(enet->netdev);
> >
> >  	netdev_dbg(enet->netdev, "eea probe success.\n");
> > @@ -179,10 +682,29 @@ int eea_net_probe(struct eea_device *edev)
> >  	eea_destroy_adminq(enet);
> >
> >  err_free_netdev:
> > +	eea_free_irq_blk(enet);
> >  	free_netdev(enet->netdev);
> >  	return err;
> >  }
> >
> > +static void eea_net_ha_reset_remove(struct eea_net *enet,
> > +				    struct eea_device *edev,
> > +				    struct net_device *netdev)
> > +{
> > +	rtnl_lock();
> > +	edev->ha_reset_netdev_running = false;
> > +	if (netif_running(enet->netdev)) {
> > +		eea_netdev_stop(enet->netdev);
> > +		enet->link_err = EEA_LINK_ERR_HA_RESET_DEV;
> > +		edev->ha_reset_netdev_running = true;
> > +	}
> > +	rtnl_unlock();
> > +
> > +	eea_device_reset(edev);
> > +	eea_destroy_adminq(enet);
> > +	eea_free_irq_blk(enet);
> > +}
> > +
> >  void eea_net_remove(struct eea_device *edev)
> >  {
> >  	struct net_device *netdev;
> > @@ -191,12 +713,16 @@ void eea_net_remove(struct eea_device *edev)
> >  	enet = edev->enet;
> >  	netdev = enet->netdev;
> >
> > +	if (edev->ha_reset) {
> > +		eea_net_ha_reset_remove(enet, edev, netdev);
> > +		return;
> > +	}
> > +
> >  	unregister_netdev(netdev);
> > -	netdev_dbg(enet->netdev, "eea removed.\n");
> >
> >  	eea_device_reset(edev);
> > -
> >  	eea_destroy_adminq(enet);
> > +	eea_free_irq_blk(enet);
> >
> >  	free_netdev(netdev);
> >  }
> > diff --git a/drivers/net/ethernet/alibaba/eea/eea_net.h b/drivers/net/ethernet/alibaba/eea/eea_net.h
> > index ab487bc88af2..0398e781dfdb 100644
> > --- a/drivers/net/ethernet/alibaba/eea/eea_net.h
> > +++ b/drivers/net/ethernet/alibaba/eea/eea_net.h
> > @@ -18,6 +18,8 @@
> >  #define EEA_VER_MINOR		0
> >  #define EEA_VER_SUB_MINOR	0
> >
> > +struct eea_tx_meta;
> > +
> >  struct eea_net_tx {
> >  	struct eea_net *enet;
> >
> > @@ -101,6 +103,18 @@ struct eea_net_cfg {
> >  	u8 tx_cq_desc_size;
> >
> >  	u32 split_hdr;
> > +
> > +	struct hwtstamp_config ts_cfg;
> > +};
> > +
> > +struct eea_net_init_ctx {
> > +	struct eea_net_cfg cfg;
> > +
> > +	struct eea_net_tx *tx;
> > +	struct eea_net_rx **rx;
> > +
> > +	struct net_device *netdev;
> > +	struct eea_device *edev;
> >  };
> >
> >  enum {
> > @@ -109,6 +123,17 @@ enum {
> >  	EEA_LINK_ERR_LINK_DOWN,
> >  };
> >
> > +struct eea_irq_blk {
> > +	struct napi_struct napi;
> > +	u16 msix_vec;
> > +	bool ready;
> > +	struct eea_net_rx *rx;
> > +	char irq_name[32];
> > +	int irq;
> > +	int idx;
> > +
> > +};
> > +
> >  struct eea_net {
> >  	struct eea_device *edev;
> >  	struct net_device *netdev;
> > @@ -121,6 +146,8 @@ struct eea_net {
> >  	struct eea_net_cfg cfg;
> >  	struct eea_net_cfg cfg_hw;
> >
> > +	struct eea_irq_blk *irq_blks;
> > +
> >  	u32 link_err;
> >
> >  	bool started;
> > @@ -134,4 +161,22 @@ struct eea_net {
> >  int eea_net_probe(struct eea_device *edev);
> >  void eea_net_remove(struct eea_device *edev);
> >
> > +int eea_reset_hw_resources(struct eea_net *enet, struct eea_net_init_ctx *ctx);
> > +void eea_init_ctx(struct eea_net *enet, struct eea_net_init_ctx *ctx);
> > +int eea_queues_check_and_reset(struct eea_device *edev);
> > +
> > +/* rx apis */
> > +void enet_rx_stop(struct eea_net_rx *rx);
> > +void enet_rx_start(struct eea_net_rx *rx);
> > +
> > +void eea_free_rx(struct eea_net_rx *rx, struct eea_net_cfg *cfg);
> > +struct eea_net_rx *eea_alloc_rx(struct eea_net_init_ctx *ctx, u32 idx);
> > +
> > +/* tx apis */
> > +int eea_poll_tx(struct eea_net_tx *tx, int budget);
> > +netdev_tx_t eea_tx_xmit(struct sk_buff *skb, struct net_device *netdev);
> > +
> > +void eea_free_tx(struct eea_net_tx *tx, struct eea_net_cfg *cfg);
> > +int eea_alloc_tx(struct eea_net_init_ctx *ctx, struct eea_net_tx *tx, u32 idx);
> > +
> >  #endif
> > diff --git a/drivers/net/ethernet/alibaba/eea/eea_pci.c b/drivers/net/ethernet/alibaba/eea/eea_pci.c
> > index 97efac753cfb..e42b0298eebb 100644
> > --- a/drivers/net/ethernet/alibaba/eea/eea_pci.c
> > +++ b/drivers/net/ethernet/alibaba/eea/eea_pci.c
> > @@ -13,6 +13,9 @@
> >
> >  #define EEA_PCI_DB_OFFSET 4096
> >
> > +#define EEA_PCI_CAP_RESET_DEVICE 0xFA
> > +#define EEA_PCI_CAP_RESET_FLAG BIT(1)
> > +
> >  struct eea_pci_cfg {
> >  	__le32 reserve0;
> >  	__le32 reserve1;
> > @@ -51,6 +54,7 @@ struct eea_pci_device {
> >  	void __iomem *reg;
> >  	void __iomem *db_base;
> >
> > +	struct work_struct ha_handle_work;
> >  	char ha_irq_name[32];
> >  	u8 reset_pos;
> >  };
> > @@ -67,6 +71,11 @@ struct eea_pci_device {
> >  #define cfg_read32(reg, item) ioread32(cfg_pointer(reg, item))
> >  #define cfg_readq(reg, item) readq(cfg_pointer(reg, item))
> >
> > +/* Due to circular references, we have to add function definitions here. */
> > +static int __eea_pci_probe(struct pci_dev *pci_dev,
> > +			   struct eea_pci_device *ep_dev);
> > +static void __eea_pci_remove(struct pci_dev *pci_dev, bool flush_ha_work);
> > +
> >  const char *eea_pci_name(struct eea_device *edev)
> >  {
> >  	return pci_name(edev->ep_dev->pci_dev);
> > @@ -250,6 +259,150 @@ void eea_pci_active_aq(struct eea_ring *ering, int msix_vec)
> >  				    cfg_read32(ep_dev->reg, aq_db_off));
> >  }
> >
> > +void eea_pci_free_irq(struct eea_irq_blk *blk)
> > +{
> > +	irq_update_affinity_hint(blk->irq, NULL);
> > +	free_irq(blk->irq, blk);
> > +}
> > +
> > +int eea_pci_request_irq(struct eea_device *edev, struct eea_irq_blk *blk,
> > +			irqreturn_t (*callback)(int irq, void *data))
> > +{
> > +	struct eea_pci_device *ep_dev = edev->ep_dev;
> > +	int irq;
> > +
> > +	snprintf(blk->irq_name, sizeof(blk->irq_name), "eea-q%d@%s", blk->idx,
> > +		 pci_name(ep_dev->pci_dev));
> > +
> > +	irq = pci_irq_vector(ep_dev->pci_dev, blk->msix_vec);
> > +
> > +	blk->irq = irq;
> > +
> > +	return request_irq(irq, callback, IRQF_NO_AUTOEN, blk->irq_name, blk);
> > +}
> > +
> > +static void eea_ha_handle_reset(struct eea_pci_device *ep_dev)
> > +{
> > +	struct eea_device *edev;
> > +	struct pci_dev *pci_dev;
> > +	u16 reset;
> > +	int err;
> > +
> > +	if (!ep_dev->reset_pos) {
> > +		eea_queues_check_and_reset(&ep_dev->edev);
> > +		return;
> > +	}
> > +
> > +	edev = &ep_dev->edev;
> > +
> > +	pci_read_config_word(ep_dev->pci_dev, ep_dev->reset_pos, &reset);
> > +
> > +	/* clear bit */
> > +	pci_write_config_word(ep_dev->pci_dev, ep_dev->reset_pos, 0xFFFF);
> > +
> > +	if (reset & EEA_PCI_CAP_RESET_FLAG) {
> > +		dev_warn(&ep_dev->pci_dev->dev, "recv device reset request.\n");
> > +
> > +		pci_dev = ep_dev->pci_dev;
> > +
> > +		/* The pci remove callback may hold this lock. If the
> > +		 * pci remove callback is called, then we can ignore the
> > +		 * ha interrupt.
> > +		 */
> > +		if (mutex_trylock(&edev->ha_lock)) {
> > +			edev->ha_reset = true;
> > +
> > +			__eea_pci_remove(pci_dev, false);
> > +			err = __eea_pci_probe(pci_dev, ep_dev);
> > +			if (err)
> > +				dev_err(&ep_dev->pci_dev->dev,
> > +					"ha: re-setup failed.\n");
>
> AI still notes:
> ---
> What happens if __eea_pci_probe() fails during HA reset recovery? Jakub
> Kicinski's AI review in v25 noted that when probe fails after remove
> succeeded, the device is left in a removed state with no error beyond this
> single dev_err() message.
>
> The function returns 1 (from the implicit flow) indicating success, even
> though reprobe failed and the device is now non-functional. Should this
> check
> for errors and at minimum log the failure state more prominently?
>
> Reference:
> https://lore.kernel.org/netdev/20260204040054.1698677-2-kuba@kernel.org/
> ---
>

next prev parent reply	other threads:[~2026-03-09  8:54 UTC|newest]

Thread overview: 13+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2026-03-02  2:45 [PATCH net-next v28 0/8] eea: Add basic driver framework for Alibaba Elastic Ethernet Adaptor Xuan Zhuo
2026-03-02  2:45 ` [PATCH net-next v28 1/8] eea: introduce PCI framework Xuan Zhuo
2026-03-02  2:45 ` [PATCH net-next v28 2/8] eea: introduce ring and descriptor structures Xuan Zhuo
2026-03-02  2:45 ` [PATCH net-next v28 3/8] eea: probe the netdevice and create adminq Xuan Zhuo
2026-03-06  2:44   ` [net-next,v28,3/8] " Jakub Kicinski
2026-03-02  2:46 ` [PATCH net-next v28 4/8] eea: create/destroy rx,tx queues for netdevice open and stop Xuan Zhuo
2026-03-05 10:16   ` Paolo Abeni
2026-03-09  8:51     ` Xuan Zhuo [this message]
2026-03-10  8:38       ` Paolo Abeni
2026-03-02  2:46 ` [PATCH net-next v28 5/8] eea: implement packet receive logic Xuan Zhuo
2026-03-02  2:46 ` [PATCH net-next v28 6/8] eea: implement packet transmit logic Xuan Zhuo
2026-03-02  2:46 ` [PATCH net-next v28 7/8] eea: introduce ethtool support Xuan Zhuo
2026-03-02  2:46 ` [PATCH net-next v28 8/8] eea: introduce callback for ndo_get_stats64 Xuan Zhuo

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=1773046268.140821-1-xuanzhuo@linux.alibaba.com \
    --to=xuanzhuo@linux.alibaba.com \
    --cc=andrew+netdev@lunn.ch \
    --cc=davem@davemloft.net \
    --cc=dong100@mucse.com \
    --cc=dust.li@linux.alibaba.com \
    --cc=edumazet@google.com \
    --cc=guwen@linux.alibaba.com \
    --cc=hkallweit1@gmail.com \
    --cc=kuba@kernel.org \
    --cc=lorenzo@kernel.org \
    --cc=lukas.bulwahn@redhat.com \
    --cc=lulie@linux.alibaba.com \
    --cc=netdev@vger.kernel.org \
    --cc=pabeni@redhat.com \
    --cc=vadim.fedorenko@linux.dev \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link

Be sure your reply has a Subject: header at the top and a blank line before the message body.

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox