All of lore.kernel.org
 help / color / mirror / Atom feed
From: Matthew Brost <matthew.brost@intel.com>
To: "José Roberto de Souza" <jose.souza@intel.com>
Cc: <intel-xe@lists.freedesktop.org>
Subject: Re: [PATCH] drm/xe: Force write completion of MI_STORE_DATA_IMM
Date: Tue, 17 Dec 2024 15:39:42 -0800	[thread overview]
Message-ID: <Z2ILvmX9y87iFvZP@lstrano-desk.jf.intel.com> (raw)
In-Reply-To: <20241217160732.46280-1-jose.souza@intel.com>

On Tue, Dec 17, 2024 at 08:07:32AM -0800, José Roberto de Souza wrote:
> With Force write completion unset there is no guarantees of when the
> write will be globally visible what is not the behavior wanted.
> 

Do we want this backported? If so, maybe add a fixes?

Matt

> Signed-off-by: José Roberto de Souza <jose.souza@intel.com>
> ---
>  drivers/gpu/drm/xe/instructions/xe_mi_commands.h | 13 +++++++------
>  drivers/gpu/drm/xe/xe_migrate.c                  | 11 ++++++++---
>  drivers/gpu/drm/xe/xe_oa.c                       |  4 +++-
>  drivers/gpu/drm/xe/xe_ring_ops.c                 |  6 ++++--
>  4 files changed, 22 insertions(+), 12 deletions(-)
> 
> diff --git a/drivers/gpu/drm/xe/instructions/xe_mi_commands.h b/drivers/gpu/drm/xe/instructions/xe_mi_commands.h
> index 10ec2920d31b3..f4ee910f09432 100644
> --- a/drivers/gpu/drm/xe/instructions/xe_mi_commands.h
> +++ b/drivers/gpu/drm/xe/instructions/xe_mi_commands.h
> @@ -33,12 +33,13 @@
>  #define MI_TOPOLOGY_FILTER		__MI_INSTR(0xD)
>  #define MI_FORCE_WAKEUP			__MI_INSTR(0x1D)
>  
> -#define MI_STORE_DATA_IMM		__MI_INSTR(0x20)
> -#define   MI_SDI_GGTT			REG_BIT(22)
> -#define   MI_SDI_LEN_DW			GENMASK(9, 0)
> -#define   MI_SDI_NUM_DW(x)		REG_FIELD_PREP(MI_SDI_LEN_DW, (x) + 3 - 2)
> -#define   MI_SDI_NUM_QW(x)		(REG_FIELD_PREP(MI_SDI_LEN_DW, 2 * (x) + 3 - 2) | \
> -					 REG_BIT(21))
> +#define MI_STORE_DATA_IMM			__MI_INSTR(0x20)
> +#define   MI_SDI_GGTT				REG_BIT(22)
> +#define   MI_FORCE_WRITE_COMPLETION_CHECK	REG_BIT(10)
> +#define   MI_SDI_LEN_DW				GENMASK(9, 0)
> +#define   MI_SDI_NUM_DW(x)			REG_FIELD_PREP(MI_SDI_LEN_DW, (x) + 3 - 2)
> +#define   MI_SDI_NUM_QW(x)			(REG_FIELD_PREP(MI_SDI_LEN_DW, 2 * (x) + 3 - 2) | \
> +						 REG_BIT(21))
>  
>  #define MI_LOAD_REGISTER_IMM		__MI_INSTR(0x22)
>  #define   MI_LRI_LRM_CS_MMIO		REG_BIT(19)
> diff --git a/drivers/gpu/drm/xe/xe_migrate.c b/drivers/gpu/drm/xe/xe_migrate.c
> index 1b97d90aaddaf..8b32fad678782 100644
> --- a/drivers/gpu/drm/xe/xe_migrate.c
> +++ b/drivers/gpu/drm/xe/xe_migrate.c
> @@ -581,7 +581,9 @@ static void emit_pte(struct xe_migrate *m,
>  	while (ptes) {
>  		u32 chunk = min(MAX_PTE_PER_SDI, ptes);
>  
> -		bb->cs[bb->len++] = MI_STORE_DATA_IMM | MI_SDI_NUM_QW(chunk);
> +		bb->cs[bb->len++] = MI_STORE_DATA_IMM |
> +				    MI_FORCE_WRITE_COMPLETION_CHECK |
> +				    MI_SDI_NUM_QW(chunk);
>  		bb->cs[bb->len++] = ofs;
>  		bb->cs[bb->len++] = 0;
>  
> @@ -1223,7 +1225,9 @@ static void write_pgtable(struct xe_tile *tile, struct xe_bb *bb, u64 ppgtt_ofs,
>  		if (!(bb->len & 1))
>  			bb->cs[bb->len++] = MI_NOOP;
>  
> -		bb->cs[bb->len++] = MI_STORE_DATA_IMM | MI_SDI_NUM_QW(chunk);
> +		bb->cs[bb->len++] = MI_STORE_DATA_IMM |
> +				    MI_FORCE_WRITE_COMPLETION_CHECK |
> +				    MI_SDI_NUM_QW(chunk);
>  		bb->cs[bb->len++] = lower_32_bits(addr);
>  		bb->cs[bb->len++] = upper_32_bits(addr);
>  		if (pt_op->bind)
> @@ -1388,7 +1392,8 @@ __xe_migrate_update_pgtables(struct xe_migrate *m,
>  			u32 idx = 0;
>  
>  			bb->cs[bb->len++] = MI_STORE_DATA_IMM |
> -				MI_SDI_NUM_QW(chunk);
> +					    MI_FORCE_WRITE_COMPLETION_CHECK |
> +					    MI_SDI_NUM_QW(chunk);
>  			bb->cs[bb->len++] = ofs;
>  			bb->cs[bb->len++] = 0; /* upper_32_bits */
>  
> diff --git a/drivers/gpu/drm/xe/xe_oa.c b/drivers/gpu/drm/xe/xe_oa.c
> index 56bf375a9d4bc..ae94490b0eac8 100644
> --- a/drivers/gpu/drm/xe/xe_oa.c
> +++ b/drivers/gpu/drm/xe/xe_oa.c
> @@ -690,7 +690,9 @@ static void xe_oa_store_flex(struct xe_oa_stream *stream, struct xe_lrc *lrc,
>  	u32 offset = xe_bo_ggtt_addr(lrc->bo);
>  
>  	do {
> -		bb->cs[bb->len++] = MI_STORE_DATA_IMM | MI_SDI_GGTT | MI_SDI_NUM_DW(1);
> +		bb->cs[bb->len++] = MI_STORE_DATA_IMM | MI_SDI_GGTT |
> +				    MI_FORCE_WRITE_COMPLETION_CHECK |
> +				    MI_SDI_NUM_DW(1);
>  		bb->cs[bb->len++] = offset + flex->offset * sizeof(u32);
>  		bb->cs[bb->len++] = 0;
>  		bb->cs[bb->len++] = flex->value;
> diff --git a/drivers/gpu/drm/xe/xe_ring_ops.c b/drivers/gpu/drm/xe/xe_ring_ops.c
> index 0be4f489d3e12..3a75a08b6be92 100644
> --- a/drivers/gpu/drm/xe/xe_ring_ops.c
> +++ b/drivers/gpu/drm/xe/xe_ring_ops.c
> @@ -72,7 +72,8 @@ static int emit_user_interrupt(u32 *dw, int i)
>  
>  static int emit_store_imm_ggtt(u32 addr, u32 value, u32 *dw, int i)
>  {
> -	dw[i++] = MI_STORE_DATA_IMM | MI_SDI_GGTT | MI_SDI_NUM_DW(1);
> +	dw[i++] = MI_STORE_DATA_IMM | MI_SDI_GGTT |
> +		  MI_FORCE_WRITE_COMPLETION_CHECK | MI_SDI_NUM_DW(1);
>  	dw[i++] = addr;
>  	dw[i++] = 0;
>  	dw[i++] = value;
> @@ -162,7 +163,8 @@ static int emit_pipe_invalidate(u32 mask_flags, bool invalidate_tlb, u32 *dw,
>  static int emit_store_imm_ppgtt_posted(u64 addr, u64 value,
>  				       u32 *dw, int i)
>  {
> -	dw[i++] = MI_STORE_DATA_IMM | MI_SDI_NUM_QW(1);
> +	dw[i++] = MI_STORE_DATA_IMM | MI_FORCE_WRITE_COMPLETION_CHECK |
> +		  MI_SDI_NUM_QW(1);
>  	dw[i++] = lower_32_bits(addr);
>  	dw[i++] = upper_32_bits(addr);
>  	dw[i++] = lower_32_bits(value);
> -- 
> 2.47.1
> 

  parent reply	other threads:[~2024-12-17 23:39 UTC|newest]

Thread overview: 17+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2024-12-17 16:07 [PATCH] drm/xe: Force write completion of MI_STORE_DATA_IMM José Roberto de Souza
2024-12-17 17:36 ` Dixit, Ashutosh
2024-12-17 21:58 ` ✓ CI.Patch_applied: success for " Patchwork
2024-12-17 21:58 ` ✓ CI.checkpatch: " Patchwork
2024-12-17 21:59 ` ✓ CI.KUnit: " Patchwork
2024-12-17 22:17 ` ✓ CI.Build: " Patchwork
2024-12-17 22:20 ` ✓ CI.Hooks: " Patchwork
2024-12-17 22:21 ` ✓ CI.checksparse: " Patchwork
2024-12-17 22:59 ` ✓ Xe.CI.BAT: " Patchwork
2024-12-17 23:39 ` Matthew Brost [this message]
2024-12-18 15:38   ` [PATCH] " Souza, Jose
2024-12-18 17:27     ` Matthew Brost
2024-12-19  2:05       ` Dixit, Ashutosh
2024-12-19 13:58         ` Souza, Jose
2024-12-19 16:05           ` Dixit, Ashutosh
2024-12-23 15:14       ` Thomas Hellström
2024-12-18  9:07 ` ✗ Xe.CI.Full: failure for " Patchwork

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=Z2ILvmX9y87iFvZP@lstrano-desk.jf.intel.com \
    --to=matthew.brost@intel.com \
    --cc=intel-xe@lists.freedesktop.org \
    --cc=jose.souza@intel.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.