From: Tvrtko Ursulin <tvrtko.ursulin@linux.intel.com>
To: Chris Wilson <chris@chris-wilson.co.uk>, intel-gfx@lists.freedesktop.org
Subject: Re: [PATCH v2 05/14] drm/i915: Deconstruct execute fence
Date: Fri, 17 Feb 2017 14:26:04 +0000 [thread overview]
Message-ID: <0ac032a6-5a8f-7e55-44dd-6bd3d286400b@linux.intel.com> (raw)
In-Reply-To: <20170214095413.26452-6-chris@chris-wilson.co.uk>
On 14/02/2017 09:54, Chris Wilson wrote:
> On reflection, we are only using the execute fence as a waitqueue on the
> global_seqno and not using it for dependency tracking between fences
> (unlike the submit and dma fences). By only treating it as a waitqueue,
> we can then treat it similar to the other waitqueues durin submit,
during
> making the code simpler.
>
> Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
> ---
> drivers/gpu/drm/i915/i915_gem_request.c | 47 +++++++--------------------------
> drivers/gpu/drm/i915/i915_gem_request.h | 10 +------
> 2 files changed, 11 insertions(+), 46 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/i915_gem_request.c b/drivers/gpu/drm/i915/i915_gem_request.c
> index 001fc9fedf49..bb59acaa8a34 100644
> --- a/drivers/gpu/drm/i915/i915_gem_request.c
> +++ b/drivers/gpu/drm/i915/i915_gem_request.c
> @@ -69,7 +69,6 @@ static void i915_fence_release(struct dma_fence *fence)
> * caught trying to reuse dead objects.
> */
> i915_sw_fence_fini(&req->submit);
> - i915_sw_fence_fini(&req->execute);
>
> kmem_cache_free(req->i915->requests, req);
> }
> @@ -211,7 +210,6 @@ static void i915_gem_request_retire(struct drm_i915_gem_request *request)
>
> lockdep_assert_held(&request->i915->drm.struct_mutex);
> GEM_BUG_ON(!i915_sw_fence_signaled(&request->submit));
> - GEM_BUG_ON(!i915_sw_fence_signaled(&request->execute));
> GEM_BUG_ON(!i915_gem_request_completed(request));
>
> GEM_BUG_ON(!request->i915->gt.active_requests);
> @@ -422,7 +420,7 @@ void __i915_gem_request_submit(struct drm_i915_gem_request *request)
> list_move_tail(&request->link, &timeline->requests);
> spin_unlock(&request->timeline->lock);
>
> - i915_sw_fence_commit(&request->execute);
> + wake_up_all(&request->execute);
> }
>
> void i915_gem_request_submit(struct drm_i915_gem_request *request)
> @@ -457,24 +455,6 @@ submit_notify(struct i915_sw_fence *fence, enum i915_sw_fence_notify state)
> return NOTIFY_DONE;
> }
>
> -static int __i915_sw_fence_call
> -execute_notify(struct i915_sw_fence *fence, enum i915_sw_fence_notify state)
> -{
> - struct drm_i915_gem_request *request =
> - container_of(fence, typeof(*request), execute);
> -
> - switch (state) {
> - case FENCE_COMPLETE:
> - break;
> -
> - case FENCE_FREE:
> - i915_gem_request_put(request);
> - break;
> - }
> -
> - return NOTIFY_DONE;
> -}
> -
> /**
> * i915_gem_request_alloc - allocate a request structure
> *
> @@ -567,13 +547,7 @@ i915_gem_request_alloc(struct intel_engine_cs *engine,
>
> /* We bump the ref for the fence chain */
> i915_sw_fence_init(&i915_gem_request_get(req)->submit, submit_notify);
> - i915_sw_fence_init(&i915_gem_request_get(req)->execute, execute_notify);
> -
> - /* Ensure that the execute fence completes after the submit fence -
> - * as we complete the execute fence from within the submit fence
> - * callback, its completion would otherwise be visible first.
> - */
> - i915_sw_fence_await_sw_fence(&req->execute, &req->submit, &req->execq);
> + init_waitqueue_head(&req->execute);
>
> i915_priotree_init(&req->priotree);
>
> @@ -1015,6 +989,7 @@ long i915_wait_request(struct drm_i915_gem_request *req,
> TASK_INTERRUPTIBLE : TASK_UNINTERRUPTIBLE;
> wait_queue_head_t *errq = &req->i915->gpu_error.wait_queue;
> DEFINE_WAIT(reset);
> + DEFINE_WAIT(exec);
> struct intel_wait wait;
>
> might_sleep();
> @@ -1036,12 +1011,11 @@ long i915_wait_request(struct drm_i915_gem_request *req,
> if (flags & I915_WAIT_LOCKED)
> add_wait_queue(errq, &reset);
>
> - if (!i915_sw_fence_done(&req->execute)) {
> - DEFINE_WAIT(exec);
> -
> + reset_wait_queue(&req->execute, &exec);
> + if (!req->global_seqno) {
> do {
> - prepare_to_wait(&req->execute.wait, &exec, state);
Somehow I missed the moment when reset_wait_queue was introduced. But
why you can't just use prepare_to_wait here?
Otherwise looks OK.
Regards,
Tvrtko
> - if (i915_sw_fence_done(&req->execute))
> + set_current_state(state);
> + if (req->global_seqno)
> break;
>
> if (flags & I915_WAIT_LOCKED &&
> @@ -1064,15 +1038,14 @@ long i915_wait_request(struct drm_i915_gem_request *req,
>
> timeout = io_schedule_timeout(timeout);
> } while (1);
> - finish_wait(&req->execute.wait, &exec);
> + finish_wait(&req->execute, &exec);
>
> if (timeout < 0)
> goto complete;
>
> - GEM_BUG_ON(!i915_sw_fence_done(&req->execute));
> + GEM_BUG_ON(!req->global_seqno);
> }
> - GEM_BUG_ON(!i915_sw_fence_done(&req->submit));
> - GEM_BUG_ON(!req->global_seqno);
> + GEM_BUG_ON(!i915_sw_fence_signaled(&req->submit));
>
> /* Optimistic short spin before touching IRQs */
> if (i915_spin_request(req, state, 5))
> diff --git a/drivers/gpu/drm/i915/i915_gem_request.h b/drivers/gpu/drm/i915/i915_gem_request.h
> index 9049936c571c..467d3e13fce0 100644
> --- a/drivers/gpu/drm/i915/i915_gem_request.h
> +++ b/drivers/gpu/drm/i915/i915_gem_request.h
> @@ -119,18 +119,10 @@ struct drm_i915_gem_request {
> * The submit fence is used to await upon all of the request's
> * dependencies. When it is signaled, the request is ready to run.
> * It is used by the driver to then queue the request for execution.
> - *
> - * The execute fence is used to signal when the request has been
> - * sent to hardware.
> - *
> - * It is illegal for the submit fence of one request to wait upon the
> - * execute fence of an earlier request. It should be sufficient to
> - * wait upon the submit fence of the earlier request.
> */
> struct i915_sw_fence submit;
> - struct i915_sw_fence execute;
> wait_queue_t submitq;
> - wait_queue_t execq;
> + wait_queue_head_t execute;
>
> /* A list of everyone we wait upon, and everyone who waits upon us.
> * Even though we will not be submitted to the hardware before the
>
_______________________________________________
Intel-gfx mailing list
Intel-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/intel-gfx
next prev parent reply other threads:[~2017-02-17 14:26 UTC|newest]
Thread overview: 30+ messages / expand[flat|nested] mbox.gz Atom feed top
2017-02-14 9:53 Prep work for preemption and GEM bugfixes Chris Wilson
2017-02-14 9:54 ` [PATCH v2 01/14] drm/i915: Keep a global seqno per-engine Chris Wilson
2017-02-15 17:05 ` Tvrtko Ursulin
2017-02-15 21:49 ` Chris Wilson
2017-02-15 22:20 ` Chris Wilson
2017-02-15 22:36 ` Chris Wilson
2017-02-16 8:10 ` Tvrtko Ursulin
2017-02-16 8:28 ` Chris Wilson
2017-02-14 9:54 ` [PATCH v2 02/14] drm/i915: Use a local to shorten req->i915->gpu_error.wait_queue Chris Wilson
2017-02-15 17:06 ` Tvrtko Ursulin
2017-02-14 9:54 ` [PATCH v2 03/14] drm/i915: Add ourselves to the gpu error waitqueue for the entire wait Chris Wilson
2017-02-15 17:11 ` Tvrtko Ursulin
2017-02-14 9:54 ` [PATCH v2 04/14] drm/i915: Inline __i915_gem_request_wait_for_execute() Chris Wilson
2017-02-17 14:04 ` Tvrtko Ursulin
2017-02-14 9:54 ` [PATCH v2 05/14] drm/i915: Deconstruct execute fence Chris Wilson
2017-02-17 14:26 ` Tvrtko Ursulin [this message]
2017-02-17 14:41 ` Chris Wilson
2017-02-17 14:55 ` Tvrtko Ursulin
2017-02-14 9:54 ` [PATCH v2 06/14] drm/i915: Protect the request->global_seqno with the engine->timeline lock Chris Wilson
2017-02-17 14:43 ` Tvrtko Ursulin
2017-02-22 12:38 ` Chris Wilson
2017-02-14 9:54 ` [PATCH v2 07/14] drm/i915: Take a reference whilst processing the signaler request Chris Wilson
2017-02-14 9:54 ` [PATCH v2 08/14] drm/i915: Allow an request to be cancelled Chris Wilson
2017-02-14 9:54 ` [PATCH v2 09/14] drm/i915: Remove the preempted request from the execution queue Chris Wilson
2017-02-14 9:54 ` [PATCH v2 10/14] drm/i915: Exercise request cancellation using a mock selftest Chris Wilson
2017-02-14 9:54 ` [PATCH v2 11/14] drm/i915: Replace reset_wait_queue with default_wake_function Chris Wilson
2017-02-14 9:54 ` [PATCH v2 12/14] drm/i915: Refactor direct GPU reset from request waiters Chris Wilson
2017-02-14 9:54 ` [PATCH v2 13/14] drm/i915: Immediately process a reset before starting waiting Chris Wilson
2017-02-14 9:54 ` [PATCH v2 14/14] drm/i915: Remove one level of indention from wait-for-execute Chris Wilson
2017-02-14 11:52 ` ✓ Fi.CI.BAT: success for series starting with [v2,01/14] drm/i915: Keep a global seqno per-engine Patchwork
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=0ac032a6-5a8f-7e55-44dd-6bd3d286400b@linux.intel.com \
--to=tvrtko.ursulin@linux.intel.com \
--cc=chris@chris-wilson.co.uk \
--cc=intel-gfx@lists.freedesktop.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox