Intel-XE Archive on lore.kernel.org
 help / color / mirror / Atom feed
From: Rodrigo Vivi <rodrigo.vivi@intel.com>
To: Raag Jadav <raag.jadav@intel.com>
Cc: <intel-xe@lists.freedesktop.org>, <matthew.brost@intel.com>,
	<thomas.hellstrom@linux.intel.com>, <riana.tauro@intel.com>,
	<michal.wajdeczko@intel.com>, <matthew.d.roper@intel.com>,
	<michal.winiarski@intel.com>, <matthew.auld@intel.com>,
	<dev@lankhorst.se>, <jani.nikula@intel.com>,
	<lukasz.laguna@intel.com>, <zhanjun.dong@intel.com>,
	 <lukas@wunner.de>, <daniele.ceraolospurio@intel.com>,
	<badal.nilawar@intel.com>
Subject: Re: [PATCH v8 07/10] drm/xe/pm: Introduce xe_device_suspend/resume()
Date: Wed, 3 Jun 2026 06:58:27 -0400	[thread overview]
Message-ID: <aiAI00V5x5zWNAx2@intel.com> (raw)
In-Reply-To: <20260603101814.916948-8-raag.jadav@intel.com>

On Wed, Jun 03, 2026 at 03:47:07PM +0530, Raag Jadav wrote:
> PCIe FLR prepare/re-initialization flows pretty much reflect system
> suspend/resume flows with a few notable exceptions. Repurpose existing
> helpers for PCIe FLR with an explicit flag to distinguish between both
> flows.
> 
> Suggested-by: Daniele Ceraolo Spurio <daniele.ceraolospurio@intel.com>
> Signed-off-by: Raag Jadav <raag.jadav@intel.com>

neat!

Reviewed-by: Rodrigo Vivi <rodrigo.vivi@intel.com>

> ---
> v6: Repurpose system suspend/resume helpers for FLR (Daniele)
> ---
>  drivers/gpu/drm/xe/xe_device.c | 150 +++++++++++++++++++++++++++++++++
>  drivers/gpu/drm/xe/xe_device.h |   2 +
>  drivers/gpu/drm/xe/xe_pm.c     | 103 ++--------------------
>  3 files changed, 160 insertions(+), 95 deletions(-)
> 
> diff --git a/drivers/gpu/drm/xe/xe_device.c b/drivers/gpu/drm/xe/xe_device.c
> index d224861b6f6f..9e0cbad8adb0 100644
> --- a/drivers/gpu/drm/xe/xe_device.c
> +++ b/drivers/gpu/drm/xe/xe_device.c
> @@ -38,6 +38,7 @@
>  #include "xe_force_wake.h"
>  #include "xe_ggtt.h"
>  #include "xe_gt.h"
> +#include "xe_gt_idle.h"
>  #include "xe_gt_mcr.h"
>  #include "xe_gt_printk.h"
>  #include "xe_gt_sriov_vf.h"
> @@ -65,6 +66,7 @@
>  #include "xe_soc_remapper.h"
>  #include "xe_survivability_mode.h"
>  #include "xe_sriov.h"
> +#include "xe_sriov_vf_ccs.h"
>  #include "xe_svm.h"
>  #include "xe_sysctrl.h"
>  #include "xe_tile.h"
> @@ -1512,3 +1514,151 @@ struct xe_vm *xe_device_asid_to_vm(struct xe_device *xe, u32 asid)
>  
>  	return vm;
>  }
> +
> +/**
> + * xe_device_suspend() - Common helper for system suspend and FLR prepare
> + * @xe: xe device instance
> + * @flr: indicate FLR prepare
> + *
> + * Return: 0 on success, negative error code otherwise.
> + */
> +int xe_device_suspend(struct xe_device *xe, bool flr)
> +{
> +	struct xe_gt *gt;
> +	u8 id;
> +	int err;
> +
> +	err = xe_pxp_pm_suspend(xe->pxp);
> +	if (err)
> +		return err;
> +
> +	xe_late_bind_wait_for_worker_completion(&xe->late_bind);
> +
> +	for_each_gt(gt, xe, id)
> +		xe_gt_suspend_prepare(gt);
> +
> +	if (flr) {
> +		for_each_gt(gt, xe, id)
> +			xe_gt_flr_prepare(gt);
> +	} else {
> +		xe_display_pm_suspend(xe);
> +
> +		/* FIXME: Super racey... */
> +		err = xe_bo_evict_all(xe);
> +		if (err)
> +			goto err_display;
> +
> +		for_each_gt(gt, xe, id) {
> +			err = xe_gt_suspend(gt);
> +			if (err)
> +				goto err_display;
> +		}
> +	}
> +
> +	xe_irq_suspend(xe);
> +
> +	if (flr) {
> +		/* TODO: Drop all user bos */
> +		xe_bo_pci_dev_remove_pinned(xe);
> +
> +		unmap_mapping_range(xe->drm.anon_inode->i_mapping, 0, 0, 1);
> +	} else {
> +		xe_display_pm_suspend_late(xe);
> +
> +		xe_i2c_pm_suspend(xe);
> +	}
> +
> +	return 0;
> +
> +err_display:
> +	xe_display_pm_resume(xe);
> +	xe_pxp_pm_resume(xe->pxp);
> +	return err;
> +}
> +
> +/**
> + * xe_device_resume() - Common helper for System resume and re-initialization post FLR
> + * @xe: xe device instance
> + * @flr: indicate re-initialization post FLR
> + *
> + * Return: 0 on success
> + */
> +int xe_device_resume(struct xe_device *xe, bool flr)
> +{
> +	struct xe_tile *tile;
> +	struct xe_gt *gt;
> +	u8 id;
> +	int err;
> +
> +	for_each_gt(gt, xe, id)
> +		xe_gt_idle_disable_c6(gt);
> +
> +	for_each_tile(tile, xe, id)
> +		xe_wa_apply_tile_workarounds(tile);
> +
> +	err = xe_pcode_ready(xe, true);
> +	if (err)
> +		return err;
> +
> +	assert_lmem_ready(xe);
> +
> +	if (flr) {
> +		err = xe_bo_restore_map(xe);
> +		if (err)
> +			return err;
> +
> +		for_each_gt(gt, xe, id) {
> +			err = xe_gt_reinit(gt);
> +			if (err)
> +				return err;
> +		}
> +	} else {
> +		xe_display_pm_resume_early(xe);
> +
> +		/*
> +		 * This only restores pinned memory which is the memory required for the
> +		 * GT(s) to resume.
> +		 */
> +		err = xe_bo_restore_early(xe);
> +		if (err)
> +			return err;
> +	}
> +
> +	xe_i2c_pm_resume(xe, true);
> +
> +	xe_sysctrl_pm_resume(xe);
> +
> +	xe_irq_resume(xe);
> +
> +	for_each_gt(gt, xe, id) {
> +		err = xe_gt_resume(gt);
> +		if (err)
> +			break;
> +	}
> +
> +	if (flr) {
> +		if (err)
> +			return err;
> +	} else {
> +		/*
> +		 * Try to bring up display before bailing from GT resume failure,
> +		 * so we don't leave the user clueless with a blank screen.
> +		 */
> +		xe_display_pm_resume(xe);
> +		if (err)
> +			return err;
> +
> +		err = xe_bo_restore_late(xe);
> +		if (err)
> +			return err;
> +
> +		if (IS_VF_CCS_READY(xe))
> +			xe_sriov_vf_ccs_register_context(xe);
> +	}
> +
> +	xe_pxp_pm_resume(xe->pxp);
> +
> +	xe_late_bind_fw_load(&xe->late_bind);
> +
> +	return 0;
> +}
> diff --git a/drivers/gpu/drm/xe/xe_device.h b/drivers/gpu/drm/xe/xe_device.h
> index 975768a6a9c8..d61fdb362f91 100644
> --- a/drivers/gpu/drm/xe/xe_device.h
> +++ b/drivers/gpu/drm/xe/xe_device.h
> @@ -48,7 +48,9 @@ int xe_device_init_early(struct xe_device *xe);
>  int xe_device_probe_early(struct xe_device *xe);
>  int xe_device_probe(struct xe_device *xe);
>  void xe_device_remove(struct xe_device *xe);
> +int xe_device_resume(struct xe_device *xe, bool flr);
>  void xe_device_shutdown(struct xe_device *xe);
> +int xe_device_suspend(struct xe_device *xe, bool flr);
>  
>  void xe_device_wmb(struct xe_device *xe);
>  
> diff --git a/drivers/gpu/drm/xe/xe_pm.c b/drivers/gpu/drm/xe/xe_pm.c
> index 99562f691080..161d3f36f372 100644
> --- a/drivers/gpu/drm/xe/xe_pm.c
> +++ b/drivers/gpu/drm/xe/xe_pm.c
> @@ -172,52 +172,18 @@ static void xe_rpm_lockmap_release(const struct xe_device *xe)
>   */
>  int xe_pm_suspend(struct xe_device *xe)
>  {
> -	struct xe_gt *gt;
> -	u8 id;
>  	int err;
>  
>  	drm_dbg(&xe->drm, "Suspending device\n");
>  	xe_pm_block_begin_signalling();
>  	trace_xe_pm_suspend(xe, __builtin_return_address(0));
>  
> -	err = xe_pxp_pm_suspend(xe->pxp);
> +	err = xe_device_suspend(xe, false);
>  	if (err)
> -		goto err;
> +		drm_dbg(&xe->drm, "Device suspend failed %d\n", err);
> +	else
> +		drm_dbg(&xe->drm, "Device suspended\n");
>  
> -	xe_late_bind_wait_for_worker_completion(&xe->late_bind);
> -
> -	for_each_gt(gt, xe, id)
> -		xe_gt_suspend_prepare(gt);
> -
> -	xe_display_pm_suspend(xe);
> -
> -	/* FIXME: Super racey... */
> -	err = xe_bo_evict_all(xe);
> -	if (err)
> -		goto err_display;
> -
> -	for_each_gt(gt, xe, id) {
> -		err = xe_gt_suspend(gt);
> -		if (err)
> -			goto err_display;
> -	}
> -
> -	xe_irq_suspend(xe);
> -
> -	xe_display_pm_suspend_late(xe);
> -
> -	xe_i2c_pm_suspend(xe);
> -
> -	drm_dbg(&xe->drm, "Device suspended\n");
> -	xe_pm_block_end_signalling();
> -
> -	return 0;
> -
> -err_display:
> -	xe_display_pm_resume(xe);
> -	xe_pxp_pm_resume(xe->pxp);
> -err:
> -	drm_dbg(&xe->drm, "Device suspend failed %d\n", err);
>  	xe_pm_block_end_signalling();
>  	return err;
>  }
> @@ -230,71 +196,18 @@ int xe_pm_suspend(struct xe_device *xe)
>   */
>  int xe_pm_resume(struct xe_device *xe)
>  {
> -	struct xe_tile *tile;
> -	struct xe_gt *gt;
> -	u8 id;
>  	int err;
>  
>  	xe_pm_block_begin_signalling();
>  	drm_dbg(&xe->drm, "Resuming device\n");
>  	trace_xe_pm_resume(xe, __builtin_return_address(0));
>  
> -	for_each_gt(gt, xe, id)
> -		xe_gt_idle_disable_c6(gt);
> -
> -	for_each_tile(tile, xe, id)
> -		xe_wa_apply_tile_workarounds(tile);
> -
> -	err = xe_pcode_ready(xe, true);
> -	if (err)
> -		return err;
> -
> -	xe_display_pm_resume_early(xe);
> -
> -	/*
> -	 * This only restores pinned memory which is the memory required for the
> -	 * GT(s) to resume.
> -	 */
> -	err = xe_bo_restore_early(xe);
> -	if (err)
> -		goto err;
> -
> -	xe_i2c_pm_resume(xe, true);
> -
> -	xe_sysctrl_pm_resume(xe);
> -
> -	xe_irq_resume(xe);
> -
> -	for_each_gt(gt, xe, id) {
> -		err = xe_gt_resume(gt);
> -		if (err)
> -			break;
> -	}
> -
> -	/*
> -	 * Try to bring up display before bailing from GT resume failure,
> -	 * so we don't leave the user clueless with a blank screen.
> -	 */
> -	xe_display_pm_resume(xe);
> -	if (err)
> -		goto err;
> -
> -	err = xe_bo_restore_late(xe);
> +	err = xe_device_resume(xe, false);
>  	if (err)
> -		goto err;
> -
> -	xe_pxp_pm_resume(xe->pxp);
> -
> -	if (IS_VF_CCS_READY(xe))
> -		xe_sriov_vf_ccs_register_context(xe);
> -
> -	xe_late_bind_fw_load(&xe->late_bind);
> +		drm_dbg(&xe->drm, "Device resume failed %d\n", err);
> +	else
> +		drm_dbg(&xe->drm, "Device resumed\n");
>  
> -	drm_dbg(&xe->drm, "Device resumed\n");
> -	xe_pm_block_end_signalling();
> -	return 0;
> -err:
> -	drm_dbg(&xe->drm, "Device resume failed %d\n", err);
>  	xe_pm_block_end_signalling();
>  	return err;
>  }
> -- 
> 2.43.0
> 

  reply	other threads:[~2026-06-03 10:58 UTC|newest]

Thread overview: 20+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2026-06-03 10:17 [PATCH v8 00/10] Introduce Xe PCIe FLR Raag Jadav
2026-06-03 10:17 ` [PATCH v8 01/10] drm/xe/uc_fw: Allow re-initializing firmware Raag Jadav
2026-06-03 10:17 ` [PATCH v8 02/10] drm/xe/guc_submit: Introduce guc_exec_queue_reinit_kernel() Raag Jadav
2026-06-03 10:17 ` [PATCH v8 03/10] drm/xe/gt: Introduce FLR helpers Raag Jadav
2026-06-03 10:17 ` [PATCH v8 04/10] drm/xe/bo_evict: Introduce xe_bo_restore_map() Raag Jadav
2026-06-03 10:17 ` [PATCH v8 05/10] drm/xe/exec_queue: Introduce xe_exec_queue_reinit() Raag Jadav
2026-06-03 10:17 ` [PATCH v8 06/10] drm/xe/migrate: Introduce xe_migrate_reinit() Raag Jadav
2026-06-03 10:17 ` [PATCH v8 07/10] drm/xe/pm: Introduce xe_device_suspend/resume() Raag Jadav
2026-06-03 10:58   ` Rodrigo Vivi [this message]
2026-06-03 10:17 ` [PATCH v8 08/10] drm/xe: Improve wedged state management Raag Jadav
2026-06-03 10:56   ` Rodrigo Vivi
2026-06-04  6:52     ` Tauro, Riana
2026-06-04  8:39       ` Raag Jadav
2026-06-03 10:17 ` [PATCH v8 09/10] drm/xe/pci: Introduce PCIe FLR Raag Jadav
2026-06-03 10:40   ` Rodrigo Vivi
2026-06-03 10:17 ` [PATCH v8 10/10] drm/xe/doc: Wire up PCI Error Handling Raag Jadav
2026-06-03 10:28 ` ✗ CI.checkpatch: warning for Introduce Xe PCIe FLR (rev8) Patchwork
2026-06-03 10:29 ` ✓ CI.KUnit: success " Patchwork
2026-06-03 11:11 ` ✓ Xe.CI.BAT: " Patchwork
2026-06-03 22:55 ` ✓ Xe.CI.FULL: " Patchwork

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=aiAI00V5x5zWNAx2@intel.com \
    --to=rodrigo.vivi@intel.com \
    --cc=badal.nilawar@intel.com \
    --cc=daniele.ceraolospurio@intel.com \
    --cc=dev@lankhorst.se \
    --cc=intel-xe@lists.freedesktop.org \
    --cc=jani.nikula@intel.com \
    --cc=lukas@wunner.de \
    --cc=lukasz.laguna@intel.com \
    --cc=matthew.auld@intel.com \
    --cc=matthew.brost@intel.com \
    --cc=matthew.d.roper@intel.com \
    --cc=michal.wajdeczko@intel.com \
    --cc=michal.winiarski@intel.com \
    --cc=raag.jadav@intel.com \
    --cc=riana.tauro@intel.com \
    --cc=thomas.hellstrom@linux.intel.com \
    --cc=zhanjun.dong@intel.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox