From: Daniele Ceraolo Spurio <daniele.ceraolospurio@intel.com>
To: Arkadiusz Hiler <arkadiusz.hiler@intel.com>,
intel-gfx@lists.freedesktop.org
Subject: Re: [PATCH 3/5] drm/i915/guc: Simplify intel_guc_load()
Date: Thu, 15 Dec 2016 14:26:29 -0800 [thread overview]
Message-ID: <dff2b343-a3ab-c45b-ff01-c7e326346537@intel.com> (raw)
In-Reply-To: <20161215154708.31521-4-arkadiusz.hiler@intel.com>
On 15/12/16 07:47, Arkadiusz Hiler wrote:
> Current version of intel_guc_load() does a lot:
> - cares about submission
> - loads huc
> - implement WA
>
> This change offloads some of the logic to intel_uc_load(), which now
> cares about the above.
>
> Cc: Anusha Srivatsa <anusha.srivatsa@intel.com>
> Cc: Jeff McGee <jeff.mcgee@intel.com>
> Cc: Michal Winiarski <michal.winiarski@intel.com>
> Signed-off-by: Arkadiusz Hiler <arkadiusz.hiler@intel.com>
> ---
> drivers/gpu/drm/i915/i915_gem.c | 2 +-
> drivers/gpu/drm/i915/intel_guc_loader.c | 126 +++++---------------------------
> drivers/gpu/drm/i915/intel_uc.c | 83 +++++++++++++++++++++
> drivers/gpu/drm/i915/intel_uc.h | 8 ++
> 4 files changed, 110 insertions(+), 109 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c
> index 6af4e85..76b52c6 100644
> --- a/drivers/gpu/drm/i915/i915_gem.c
> +++ b/drivers/gpu/drm/i915/i915_gem.c
> @@ -4412,7 +4412,7 @@ i915_gem_init_hw(struct drm_i915_private *dev_priv)
> intel_mocs_init_l3cc_table(dev_priv);
>
> /* We can't enable contexts until all firmware is loaded */
> - ret = intel_guc_load(dev_priv);
> + ret = intel_uc_load(dev_priv);
> if (ret)
> goto out;
>
> diff --git a/drivers/gpu/drm/i915/intel_guc_loader.c b/drivers/gpu/drm/i915/intel_guc_loader.c
> index f8b28b1..b76b556 100644
> --- a/drivers/gpu/drm/i915/intel_guc_loader.c
> +++ b/drivers/gpu/drm/i915/intel_guc_loader.c
> @@ -97,7 +97,7 @@ const char *intel_guc_fw_status_repr(enum intel_guc_fw_status status)
> }
> };
>
> -static void guc_interrupts_release(struct drm_i915_private *dev_priv)
> +void guc_interrupts_release(struct drm_i915_private *dev_priv)
> {
> struct intel_engine_cs *engine;
> enum intel_engine_id id;
> @@ -115,7 +115,7 @@ static void guc_interrupts_release(struct drm_i915_private *dev_priv)
> I915_WRITE(GUC_WD_VECS_IER, 0);
> }
>
> -static void guc_interrupts_capture(struct drm_i915_private *dev_priv)
> +void guc_interrupts_capture(struct drm_i915_private *dev_priv)
> {
> struct intel_engine_cs *engine;
> enum intel_engine_id id;
> @@ -334,7 +334,7 @@ static int guc_ucode_xfer_dma(struct drm_i915_private *dev_priv,
> return ret;
> }
>
> -static u32 guc_wopcm_size(struct drm_i915_private *dev_priv)
> +u32 guc_wopcm_size(struct drm_i915_private *dev_priv)
> {
> u32 wopcm_size = GUC_WOPCM_TOP;
>
> @@ -417,7 +417,7 @@ static int guc_ucode_xfer(struct drm_i915_private *dev_priv)
> return ret;
> }
>
> -static int guc_hw_reset(struct drm_i915_private *dev_priv)
> +int guc_hw_reset(struct drm_i915_private *dev_priv)
If I haven't missed anything, guc_hw_reset() is only called in one place,
so we could keep the function static and move it to intel_uc.c.
> {
> int ret;
> u32 guc_status;
> @@ -452,75 +452,37 @@ int intel_guc_load(struct drm_i915_private *dev_priv)
> {
> struct intel_guc_fw *guc_fw = &dev_priv->guc.guc_fw;
> const char *fw_path = guc_fw->guc_fw_path;
> - int retries, ret, err;
> + int ret;
>
> DRM_DEBUG_DRIVER("GuC fw status: path %s, fetch %s, load %s\n",
> fw_path,
> intel_guc_fw_status_repr(guc_fw->guc_fw_fetch_status),
> intel_guc_fw_status_repr(guc_fw->guc_fw_load_status));
>
> - /* Loading forbidden, or no firmware to load? */
> - if (!i915.enable_guc_loading) {
> - err = 0;
> - goto fail;
> - } else if (fw_path == NULL) {
> + if (fw_path == NULL) {
> /* Device is known to have no uCode (e.g. no GuC) */
> - err = -ENXIO;
> - goto fail;
> + return -ENXIO;
> } else if (*fw_path == '\0') {
> /* Device has a GuC but we don't know what f/w to load? */
> WARN(1, "No GuC firmware known for this platform!\n");
> - err = -ENODEV;
> - goto fail;
> + return -ENODEV;
> }
>
> /* Fetch failed, or already fetched but failed to load? */
> if (guc_fw->guc_fw_fetch_status != GUC_FIRMWARE_SUCCESS) {
> - err = -EIO;
> - goto fail;
> + return -EIO;
> } else if (guc_fw->guc_fw_load_status == GUC_FIRMWARE_FAIL) {
> - err = -ENOEXEC;
> - goto fail;
> + return -ENOEXEC;
> }
>
> - guc_interrupts_release(dev_priv);
> - gen9_reset_guc_interrupts(dev_priv);
> -
> guc_fw->guc_fw_load_status = GUC_FIRMWARE_PENDING;
>
> - DRM_DEBUG_DRIVER("GuC fw status: fetch %s, load %s\n",
> - intel_guc_fw_status_repr(guc_fw->guc_fw_fetch_status),
> - intel_guc_fw_status_repr(guc_fw->guc_fw_load_status));
> -
> - err = i915_guc_submission_init(dev_priv);
> - if (err)
> - goto fail;
> -
> - /*
> - * WaEnableuKernelHeaderValidFix:skl,bxt
> - * For BXT, this is only upto B0 but below WA is required for later
> - * steppings also so this is extended as well.
> - */
This comment is removed, but the WA is applicable to all SKL steppings
and, according to the specs, is also applicable to HuC, so I suggest
retaining the comment and moving it to intel_uc_load().
> /* WaEnableGuCBootHashCheckNotSet:skl,bxt */
The implementation of this WA is now outside this function and it is
marked as such there. I'd personally prefer to remove this comment from
here as it might cause confusion, but no strong feelings either way.
> - for (retries = 3; ; ) {
> - /*
> - * Always reset the GuC just before (re)loading, so
> - * that the state and timing are fairly predictable
> - */
> - err = guc_hw_reset(dev_priv);
> - if (err)
> - goto fail;
> + /* we may want to retry guc ucode transfer */
> + ret = guc_ucode_xfer(dev_priv);
>
> - err = guc_ucode_xfer(dev_priv);
> - if (!err)
> - break;
> -
> - if (--retries == 0)
> - goto fail;
> -
> - DRM_INFO("GuC fw load failed: %d; will reset and "
> - "retry %d more time(s)\n", err, retries);
> - }
> + if (ret)
> + return -EAGAIN;
>
> guc_fw->guc_fw_load_status = GUC_FIRMWARE_SUCCESS;
>
> @@ -528,63 +490,7 @@ int intel_guc_load(struct drm_i915_private *dev_priv)
> intel_guc_fw_status_repr(guc_fw->guc_fw_fetch_status),
> intel_guc_fw_status_repr(guc_fw->guc_fw_load_status));
>
> - if (i915.enable_guc_submission) {
> - if (i915.guc_log_level >= 0)
> - gen9_enable_guc_interrupts(dev_priv);
> -
> - err = i915_guc_submission_enable(dev_priv);
> - if (err)
> - goto fail;
> - guc_interrupts_capture(dev_priv);
> - }
> -
> return 0;
> -
> -fail:
> - if (guc_fw->guc_fw_load_status == GUC_FIRMWARE_PENDING)
> - guc_fw->guc_fw_load_status = GUC_FIRMWARE_FAIL;
> -
> - guc_interrupts_release(dev_priv);
> - i915_guc_submission_disable(dev_priv);
> - i915_guc_submission_fini(dev_priv);
> -
> - /*
> - * We've failed to load the firmware :(
> - *
> - * Decide whether to disable GuC submission and fall back to
> - * execlist mode, and whether to hide the error by returning
> - * zero or to return -EIO, which the caller will treat as a
> - * nonfatal error (i.e. it doesn't prevent driver load, but
> - * marks the GPU as wedged until reset).
> - */
> - if (i915.enable_guc_loading > 1) {
> - ret = -EIO;
> - } else if (i915.enable_guc_submission > 1) {
> - ret = -EIO;
> - } else {
> - ret = 0;
> - }
> -
> - if (err == 0 && !HAS_GUC_UCODE(dev_priv))
> - ; /* Don't mention the GuC! */
> - else if (err == 0)
> - DRM_INFO("GuC firmware load skipped\n");
> - else if (ret != -EIO)
> - DRM_NOTE("GuC firmware load failed: %d\n", err);
> - else
> - DRM_WARN("GuC firmware load failed: %d\n", err);
> -
> - if (i915.enable_guc_submission) {
> - if (fw_path == NULL)
> - DRM_INFO("GuC submission without firmware not supported\n");
> - if (ret == 0)
> - DRM_NOTE("Falling back from GuC submission to execlist mode\n");
> - else
> - DRM_ERROR("GuC init failed: %d\n", ret);
> - }
> - i915.enable_guc_submission = 0;
> -
> - return ret;
> }
>
> static void guc_fw_fetch(struct drm_i915_private *dev_priv,
> @@ -757,6 +663,10 @@ void intel_guc_init(struct drm_i915_private *dev_priv)
> guc_fw->guc_fw_fetch_status = GUC_FIRMWARE_NONE;
> guc_fw->guc_fw_load_status = GUC_FIRMWARE_NONE;
>
> + /* can't enable guc submission without guc */
> + if (!i915.enable_guc_loading)
> + i915.enable_guc_submission = 0;
> +
> /* Early (and silent) return if GuC loading is disabled */
> if (!i915.enable_guc_loading)
> return;
> diff --git a/drivers/gpu/drm/i915/intel_uc.c b/drivers/gpu/drm/i915/intel_uc.c
> index 8eec035..4e184edb 100644
> --- a/drivers/gpu/drm/i915/intel_uc.c
> +++ b/drivers/gpu/drm/i915/intel_uc.c
> @@ -35,6 +35,89 @@ void intel_uc_init(struct drm_i915_private *dev_priv)
> intel_guc_init(dev_priv);
> }
>
> +int intel_uc_load(struct drm_i915_private *dev_priv)
> +{
> + struct intel_guc_fw *guc_fw = &dev_priv->guc.guc_fw;
> + int ret, retries;
> +
> + /* guc not enabled, nothing to do */
> + if (!i915.enable_guc_loading)
> + return 0;
> +
> + guc_interrupts_release(dev_priv);
> + gen9_reset_guc_interrupts(dev_priv);
> +
> + guc_fw->guc_fw_load_status = GUC_FIRMWARE_PENDING;
> +
> + if (i915.enable_guc_submission) {
> + ret = i915_guc_submission_init(dev_priv);
> + if (ret)
> + goto fail;
> + }
> +
> + /* WaEnableGuCBootHashCheckNotSet:skl,bxt */
> + retries = GUC_WA_HASH_CHECK_NOT_SET_ATTEPMTS;
> + while (retries--) {
> + /*
> + * Always reset the GuC just before (re)loading, so
> + * that the state and timing are fairly predictable
> + */
> + ret = guc_hw_reset(dev_priv);
> + if (ret)
> + goto fail;
> +
> + ret = intel_guc_load(dev_priv);
> + if (ret == 0 || ret != -EAGAIN)
> + break;
> +
> + DRM_INFO("GuC fw load failed: %d; will reset and "
> + "retry %d more time(s)\n", ret, retries);
> + }
> +
> + /* did we succeded or run out of retries? */
> + if (ret)
> + goto fail;
> +
> + if (i915.enable_guc_submission) {
> + if (i915.guc_log_level >= 0)
> + gen9_enable_guc_interrupts(dev_priv);
> +
> + ret = i915_guc_submission_enable(dev_priv);
> + if (ret)
> + goto fail;
> + guc_interrupts_capture(dev_priv);
> + }
> +
> + return 0;
> +
> +fail:
> + /*
> + * We've failed to load the firmware :(
> + *
> + * Decide whether to disable GuC submission and fall back to
> + * execlist mode, and whether to hide the error by returning
> + * zero or to return -EIO, which the caller will treat as a
> + * nonfatal error (i.e. it doesn't prevent driver load, but
> + * marks the GPU as wedged until reset).
> + */
> + if (i915.enable_guc_loading > 1 || i915.enable_guc_submission > 1)
> + ret = -EIO;
> + else
> + ret = 0;
> +
> + if (i915.enable_guc_submission) {
> + i915.enable_guc_submission = 0;
> + DRM_INFO("GuC submission without firmware not supported\n");
> + DRM_NOTE("Falling back from GuC submission to execlist mode\n");
If i915.enable_guc_submission > 1 we will mark the GPU as wedged, so it
might be worth retaining an error-level message here in that scenario.
Apart from the minor comments above, the code re-org looks sensible (and
required :)) and the patch lgtm.
Thanks,
Daniele
> + }
> +
> + guc_interrupts_release(dev_priv);
> + i915_guc_submission_disable(dev_priv);
> + i915_guc_submission_fini(dev_priv);
> +
> + return ret;
> +}
> +
> /*
> * Read GuC command/status register (SOFT_SCRATCH_0)
> * Return true if it contains a response rather than a command
> diff --git a/drivers/gpu/drm/i915/intel_uc.h b/drivers/gpu/drm/i915/intel_uc.h
> index ec1a5b2..89c7e1f 100644
> --- a/drivers/gpu/drm/i915/intel_uc.h
> +++ b/drivers/gpu/drm/i915/intel_uc.h
> @@ -28,6 +28,9 @@
> #include "i915_guc_reg.h"
> #include "intel_ringbuffer.h"
>
> +/* WaEnableGuCBootHashCheckNotSet:skl,bxt */
> +#define GUC_WA_HASH_CHECK_NOT_SET_ATTEPMTS 3
> +
> struct drm_i915_gem_request;
>
> /*
> @@ -171,6 +174,7 @@ struct intel_guc {
> /* intel_uc.c */
> void intel_uc_init_early(struct drm_i915_private *dev_priv);
> void intel_uc_init(struct drm_i915_private *dev_priv);
> +int intel_uc_load(struct drm_i915_private *dev_priv);
> bool intel_guc_recv(struct drm_i915_private *dev_priv, u32 *status);
> int intel_guc_send(struct intel_guc *guc, const u32 *action, u32 len);
> int intel_guc_sample_forcewake(struct intel_guc *guc);
> @@ -185,6 +189,10 @@ extern void intel_guc_fini(struct drm_i915_private *dev_priv);
> extern const char *intel_guc_fw_status_repr(enum intel_guc_fw_status status);
> extern int intel_guc_suspend(struct drm_i915_private *dev_priv);
> extern int intel_guc_resume(struct drm_i915_private *dev_priv);
> +void guc_interrupts_release(struct drm_i915_private *dev_priv);
> +void guc_interrupts_capture(struct drm_i915_private *dev_priv);
> +int guc_hw_reset(struct drm_i915_private *dev_priv);
> +u32 guc_wopcm_size(struct drm_i915_private *dev_priv);
>
> /* i915_guc_submission.c */
> int i915_guc_submission_init(struct drm_i915_private *dev_priv);
>
_______________________________________________
Intel-gfx mailing list
Intel-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/intel-gfx
next prev parent reply other threads:[~2016-12-15 22:26 UTC|newest]
Thread overview: 23+ messages / expand[flat|nested] mbox.gz Atom feed top
2016-12-15 15:47 [PATCH 0/5] GuC Scrub vol. 1 Arkadiusz Hiler
2016-12-15 15:47 ` [PATCH 1/5] drm/i915/guc: Rename _setup() to _load() Arkadiusz Hiler
2016-12-15 15:57 ` Chris Wilson
2016-12-16 11:47 ` Arkadiusz Hiler
2016-12-16 12:47 ` Chris Wilson
2016-12-15 16:22 ` Michal Wajdeczko
2016-12-16 11:43 ` Arkadiusz Hiler
2016-12-15 15:47 ` [PATCH 2/5] drm/i915/guc: Introduce intel_uc_init() Arkadiusz Hiler
2016-12-20 22:00 ` Srivatsa, Anusha
2016-12-27 16:24 ` Arkadiusz Hiler
2016-12-15 15:47 ` [PATCH 3/5] drm/i915/guc: Simplify intel_guc_load() Arkadiusz Hiler
2016-12-15 16:38 ` Michal Wajdeczko
2016-12-16 10:52 ` Arkadiusz Hiler
2016-12-15 22:26 ` Daniele Ceraolo Spurio [this message]
2016-12-16 11:16 ` Arkadiusz Hiler
2016-12-16 18:26 ` Daniele Ceraolo Spurio
2016-12-16 15:50 ` Tvrtko Ursulin
2016-12-15 15:47 ` [PATCH 4/5] drm/i915/guc: Extract param logic form guc_init Arkadiusz Hiler
2016-12-23 21:19 ` Daniele Ceraolo Spurio
2016-12-27 16:26 ` Arkadiusz Hiler
2016-12-15 15:47 ` [PATCH 5/5] drm/i915/guc: Simplify guc_fw_path Arkadiusz Hiler
2016-12-16 16:01 ` Tvrtko Ursulin
2016-12-15 17:51 ` ✗ Fi.CI.BAT: failure for GuC Scrub vol. 1 Patchwork
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=dff2b343-a3ab-c45b-ff01-c7e326346537@intel.com \
--to=daniele.ceraolospurio@intel.com \
--cc=arkadiusz.hiler@intel.com \
--cc=intel-gfx@lists.freedesktop.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox; see the mirroring instructions
for how to clone and mirror all data and code used for this inbox.