From: Daniel Vetter <daniel@ffwll.ch>
To: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Daniel Vetter <daniel.vetter@ffwll.ch>, intel-gfx@lists.freedesktop.org
Subject: Re: [PATCH 17/22] drm/i915: Use atomics to manipulate obj->frontbuffer_bits
Date: Thu, 28 Jul 2016 12:05:03 +0200 [thread overview]
Message-ID: <20160728100503.GE6232@phenom.ffwll.local> (raw)
In-Reply-To: <1469618100-15298-18-git-send-email-chris@chris-wilson.co.uk>
On Wed, Jul 27, 2016 at 12:14:55PM +0100, Chris Wilson wrote:
> The individual bits inside obj->frontbuffer_bits are protected by each
> plane->mutex, but the whole bitfield may be accessed by multiple KMS
> operations simultaneously and so the RMW needs to be done atomically.
> However, for updating the single field we do not need to mandate that it
> be under the struct_mutex, one more step towards its removal as the de
> facto BKL.
>
> Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
> Cc: Daniel Vetter <daniel.vetter@ffwll.ch>
Reviewed-by: Daniel Vetter <daniel.vetter@ffwll.ch>
> ---
> drivers/gpu/drm/i915/i915_debugfs.c | 6 ++++--
> drivers/gpu/drm/i915/i915_drv.h | 4 +---
> drivers/gpu/drm/i915/i915_gem.c | 18 +++++++++++-------
> drivers/gpu/drm/i915/intel_display.c | 18 ++++++------------
> drivers/gpu/drm/i915/intel_drv.h | 20 ++++++++++++++------
> drivers/gpu/drm/i915/intel_frontbuffer.c | 23 +++++++++--------------
> 6 files changed, 45 insertions(+), 44 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/i915_debugfs.c b/drivers/gpu/drm/i915/i915_debugfs.c
> index fcfa9ca6b50a..10a346237795 100644
> --- a/drivers/gpu/drm/i915/i915_debugfs.c
> +++ b/drivers/gpu/drm/i915/i915_debugfs.c
> @@ -138,6 +138,7 @@ describe_obj(struct seq_file *m, struct drm_i915_gem_object *obj)
> struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
> struct intel_engine_cs *engine;
> struct i915_vma *vma;
> + unsigned int frontbuffer_bits;
> int pin_count = 0;
> enum intel_engine_id id;
>
> @@ -204,8 +205,9 @@ describe_obj(struct seq_file *m, struct drm_i915_gem_object *obj)
> if (engine)
> seq_printf(m, " (%s)", engine->name);
>
> - if (obj->frontbuffer_bits)
> - seq_printf(m, " (frontbuffer: 0x%03x)", obj->frontbuffer_bits);
> + frontbuffer_bits = atomic_read(&obj->frontbuffer_bits);
> + if (frontbuffer_bits)
> + seq_printf(m, " (frontbuffer: 0x%03x)", frontbuffer_bits);
> }
>
> static int i915_gem_object_list_info(struct seq_file *m, void *data)
> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> index a24d31e3e014..b6b9a1f78238 100644
> --- a/drivers/gpu/drm/i915/i915_drv.h
> +++ b/drivers/gpu/drm/i915/i915_drv.h
> @@ -2127,8 +2127,6 @@ struct drm_i915_gem_object_ops {
> */
> #define INTEL_MAX_SPRITE_BITS_PER_PIPE 5
> #define INTEL_FRONTBUFFER_BITS_PER_PIPE 8
> -#define INTEL_FRONTBUFFER_BITS \
> - (INTEL_FRONTBUFFER_BITS_PER_PIPE * I915_MAX_PIPES)
> #define INTEL_FRONTBUFFER_PRIMARY(pipe) \
> (1 << (INTEL_FRONTBUFFER_BITS_PER_PIPE * (pipe)))
> #define INTEL_FRONTBUFFER_CURSOR(pipe) \
> @@ -2216,7 +2214,7 @@ struct drm_i915_gem_object {
> unsigned int cache_level:3;
> unsigned int cache_dirty:1;
>
> - unsigned int frontbuffer_bits:INTEL_FRONTBUFFER_BITS;
> + atomic_t frontbuffer_bits;
>
> unsigned int has_wc_mmap;
> /** Count of VMA actually bound by this object */
> diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c
> index 7db0808f6961..bc5bc5ccdde0 100644
> --- a/drivers/gpu/drm/i915/i915_gem.c
> +++ b/drivers/gpu/drm/i915/i915_gem.c
> @@ -4031,7 +4031,7 @@ void i915_gem_free_object(struct drm_gem_object *gem_obj)
> if (obj->stolen)
> i915_gem_object_unpin_pages(obj);
>
> - WARN_ON(obj->frontbuffer_bits);
> + WARN_ON(atomic_read(&obj->frontbuffer_bits));
>
> if (obj->pages && obj->madv == I915_MADV_WILLNEED &&
> dev_priv->quirks & QUIRK_PIN_SWIZZLED_PAGES &&
> @@ -4549,16 +4549,20 @@ void i915_gem_track_fb(struct drm_i915_gem_object *old,
> struct drm_i915_gem_object *new,
> unsigned frontbuffer_bits)
> {
> + /* Control of individual bits within the bitfield is guarded by
> + * the owning plane->mutex, i.e. we can never see concurrent
> + * manipulation of individual bits. But since the bitfield as a whole
> + * is updated using RMW, we need to use atomics in order to update
> + * the bits.
> + */
> if (old) {
> - WARN_ON(!mutex_is_locked(&old->base.dev->struct_mutex));
> - WARN_ON(!(old->frontbuffer_bits & frontbuffer_bits));
> - old->frontbuffer_bits &= ~frontbuffer_bits;
> + WARN_ON(!(atomic_read(&old->frontbuffer_bits) & frontbuffer_bits));
> + atomic_andnot(frontbuffer_bits, &old->frontbuffer_bits);
> }
>
> if (new) {
> - WARN_ON(!mutex_is_locked(&new->base.dev->struct_mutex));
> - WARN_ON(new->frontbuffer_bits & frontbuffer_bits);
> - new->frontbuffer_bits |= frontbuffer_bits;
> + WARN_ON(atomic_read(&new->frontbuffer_bits) & frontbuffer_bits);
> + atomic_or(frontbuffer_bits, &new->frontbuffer_bits);
> }
> }
>
> diff --git a/drivers/gpu/drm/i915/intel_display.c b/drivers/gpu/drm/i915/intel_display.c
> index ed2069c56036..1c70f68328b4 100644
> --- a/drivers/gpu/drm/i915/intel_display.c
> +++ b/drivers/gpu/drm/i915/intel_display.c
> @@ -2600,7 +2600,8 @@ valid_fb:
> primary->fb = primary->state->fb = fb;
> primary->crtc = primary->state->crtc = &intel_crtc->base;
> intel_crtc->base.state->plane_mask |= (1 << drm_plane_index(primary));
> - obj->frontbuffer_bits |= to_intel_plane(primary)->frontbuffer_bit;
> + atomic_or(to_intel_plane(primary)->frontbuffer_bit,
> + &obj->frontbuffer_bits);
> }
>
> static void i9xx_update_primary_plane(struct drm_plane *primary,
> @@ -13807,19 +13808,12 @@ static void intel_atomic_track_fbs(struct drm_atomic_state *state)
> {
> struct drm_plane_state *old_plane_state;
> struct drm_plane *plane;
> - struct drm_i915_gem_object *obj, *old_obj;
> - struct intel_plane *intel_plane;
> int i;
>
> - mutex_lock(&state->dev->struct_mutex);
> - for_each_plane_in_state(state, plane, old_plane_state, i) {
> - obj = intel_fb_obj(plane->state->fb);
> - old_obj = intel_fb_obj(old_plane_state->fb);
> - intel_plane = to_intel_plane(plane);
> -
> - i915_gem_track_fb(old_obj, obj, intel_plane->frontbuffer_bit);
> - }
> - mutex_unlock(&state->dev->struct_mutex);
> + for_each_plane_in_state(state, plane, old_plane_state, i)
> + i915_gem_track_fb(intel_fb_obj(old_plane_state->fb),
> + intel_fb_obj(plane->state->fb),
> + to_intel_plane(plane)->frontbuffer_bit);
> }
>
> /**
> diff --git a/drivers/gpu/drm/i915/intel_drv.h b/drivers/gpu/drm/i915/intel_drv.h
> index 01056ce8d461..5294039cf238 100644
> --- a/drivers/gpu/drm/i915/intel_drv.h
> +++ b/drivers/gpu/drm/i915/intel_drv.h
> @@ -1147,27 +1147,35 @@ unsigned int intel_fb_align_height(struct drm_device *dev,
> uint64_t fb_format_modifier);
>
> void __intel_fb_obj_invalidate(struct drm_i915_gem_object *obj,
> - enum fb_op_origin origin);
> + enum fb_op_origin origin,
> + unsigned int frontbuffer_bits);
> static inline void intel_fb_obj_invalidate(struct drm_i915_gem_object *obj,
> enum fb_op_origin origin)
> {
> - if (!obj->frontbuffer_bits)
> + unsigned int frontbuffer_bits;
> +
> + frontbuffer_bits = atomic_read(&obj->frontbuffer_bits);
> + if (!frontbuffer_bits)
> return;
>
> - __intel_fb_obj_invalidate(obj, origin);
> + __intel_fb_obj_invalidate(obj, origin, frontbuffer_bits);
> }
>
> void __intel_fb_obj_flush(struct drm_i915_gem_object *obj,
> bool retire,
> - enum fb_op_origin origin);
> + enum fb_op_origin origin,
> + unsigned int frontbuffer_bits);
> static inline void intel_fb_obj_flush(struct drm_i915_gem_object *obj,
> bool retire,
> enum fb_op_origin origin)
> {
> - if (!obj->frontbuffer_bits)
> + unsigned int frontbuffer_bits;
> +
> + frontbuffer_bits = atomic_read(&obj->frontbuffer_bits);
> + if (!frontbuffer_bits)
> return;
>
> - __intel_fb_obj_flush(obj, retire, origin);
> + __intel_fb_obj_flush(obj, retire, origin, frontbuffer_bits);
> }
>
> u32 intel_fb_stride_alignment(const struct drm_i915_private *dev_priv,
> diff --git a/drivers/gpu/drm/i915/intel_frontbuffer.c b/drivers/gpu/drm/i915/intel_frontbuffer.c
> index a38ccfe4894a..636324da21c2 100644
> --- a/drivers/gpu/drm/i915/intel_frontbuffer.c
> +++ b/drivers/gpu/drm/i915/intel_frontbuffer.c
> @@ -77,23 +77,22 @@
> * scheduled.
> */
> void __intel_fb_obj_invalidate(struct drm_i915_gem_object *obj,
> - enum fb_op_origin origin)
> + enum fb_op_origin origin,
> + unsigned int frontbuffer_bits)
> {
> struct drm_device *dev = obj->base.dev;
> struct drm_i915_private *dev_priv = to_i915(dev);
>
> - WARN_ON(!mutex_is_locked(&dev->struct_mutex));
> -
> if (origin == ORIGIN_CS) {
> spin_lock(&dev_priv->fb_tracking.lock);
> - dev_priv->fb_tracking.busy_bits |= obj->frontbuffer_bits;
> - dev_priv->fb_tracking.flip_bits &= ~obj->frontbuffer_bits;
> + dev_priv->fb_tracking.busy_bits |= frontbuffer_bits;
> + dev_priv->fb_tracking.flip_bits &= ~frontbuffer_bits;
> spin_unlock(&dev_priv->fb_tracking.lock);
> }
>
> - intel_psr_invalidate(dev, obj->frontbuffer_bits);
> - intel_edp_drrs_invalidate(dev, obj->frontbuffer_bits);
> - intel_fbc_invalidate(dev_priv, obj->frontbuffer_bits, origin);
> + intel_psr_invalidate(dev, frontbuffer_bits);
> + intel_edp_drrs_invalidate(dev, frontbuffer_bits);
> + intel_fbc_invalidate(dev_priv, frontbuffer_bits, origin);
> }
>
> /**
> @@ -139,15 +138,11 @@ static void intel_frontbuffer_flush(struct drm_device *dev,
> */
> void __intel_fb_obj_flush(struct drm_i915_gem_object *obj,
> bool retire,
> - enum fb_op_origin origin)
> + enum fb_op_origin origin,
> + unsigned int frontbuffer_bits)
> {
> struct drm_device *dev = obj->base.dev;
> struct drm_i915_private *dev_priv = to_i915(dev);
> - unsigned frontbuffer_bits;
> -
> - WARN_ON(!mutex_is_locked(&dev->struct_mutex));
> -
> - frontbuffer_bits = obj->frontbuffer_bits;
>
> if (retire) {
> spin_lock(&dev_priv->fb_tracking.lock);
> --
> 2.8.1
>
--
Daniel Vetter
Software Engineer, Intel Corporation
http://blog.ffwll.ch
_______________________________________________
Intel-gfx mailing list
Intel-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/intel-gfx
next prev parent reply other threads:[~2016-07-28 10:05 UTC|newest]
Thread overview: 95+ messages / expand[flat|nested] mbox.gz Atom feed top
2016-07-27 11:14 Getting to RCU and exporting fences Chris Wilson
2016-07-27 11:14 ` [PATCH 01/22] drm/i915: Combine loops within i915_gem_evict_something Chris Wilson
2016-07-29 6:17 ` Joonas Lahtinen
2016-07-29 6:31 ` Chris Wilson
2016-07-27 11:14 ` [PATCH 02/22] drm/i915: Remove surplus drm_device parameter to i915_gem_evict_something() Chris Wilson
2016-07-28 8:07 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 03/22] drm/i915: Double check the active status on the batch pool Chris Wilson
2016-07-28 8:14 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 04/22] drm/i915: Remove request retirement before each batch Chris Wilson
2016-07-28 8:32 ` Joonas Lahtinen
2016-07-28 9:32 ` Chris Wilson
2016-07-28 9:53 ` Joonas Lahtinen
2016-07-28 9:54 ` Daniel Vetter
2016-07-28 10:26 ` Chris Wilson
2016-07-28 11:52 ` Daniel Vetter
2016-07-28 12:24 ` Chris Wilson
2016-07-28 14:21 ` Chris Wilson
2016-07-27 11:14 ` [PATCH 05/22] drm/i915: Remove i915_gem_execbuffer_retire_commands() Chris Wilson
2016-07-28 8:46 ` Joonas Lahtinen
2016-07-28 8:55 ` Chris Wilson
2016-07-28 9:54 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 06/22] drm/i915: Fix up vma alignment to be u64 Chris Wilson
2016-07-28 8:59 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 07/22] drm/i915: Pad GTT views of exec objects up to user specified size Chris Wilson
2016-07-28 9:55 ` Daniel Vetter
2016-07-28 10:33 ` Chris Wilson
2016-07-29 7:59 ` Joonas Lahtinen
2016-07-29 8:08 ` Chris Wilson
2016-07-29 8:55 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 08/22] drm/i915: Reduce WARN(i915_gem_valid_gtt_space) to a debug-only check Chris Wilson
2016-07-28 9:18 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 09/22] drm/i915: Split insertion/binding of an object into the VM Chris Wilson
2016-07-28 9:25 ` Joonas Lahtinen
2016-07-28 9:34 ` Chris Wilson
2016-07-27 11:14 ` [PATCH 10/22] drm/i915: Record allocated vma size Chris Wilson
2016-07-29 6:53 ` Joonas Lahtinen
2016-07-29 7:18 ` Chris Wilson
2016-07-29 10:19 ` [PATCH] drm/i915: Convert 4096 alignment request to 0 for drm_mm allocations Chris Wilson
2016-07-29 10:28 ` Joonas Lahtinen
2016-07-29 10:38 ` Chris Wilson
2016-07-27 11:14 ` [PATCH 11/22] drm/i915: Wrap vma->pin_count accessors with small inline helpers Chris Wilson
2016-07-29 6:59 ` Joonas Lahtinen
2016-07-29 7:23 ` Chris Wilson
2016-07-27 11:14 ` [PATCH 12/22] drm/i915: Start passing around i915_vma from execbuffer Chris Wilson
2016-07-29 8:23 ` Joonas Lahtinen
2016-08-01 7:34 ` Chris Wilson
2016-07-27 11:14 ` [PATCH 13/22] drm/i915: Combine all i915_vma bitfields into a single set of flags Chris Wilson
2016-07-29 7:30 ` Joonas Lahtinen
2016-07-29 7:44 ` Chris Wilson
2016-07-27 11:14 ` [PATCH 14/22] drm/i915: Make i915_vma_pin() small and inline Chris Wilson
2016-07-28 11:06 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 15/22] drm/i915: Remove highly confusing i915_gem_obj_ggtt_pin() Chris Wilson
2016-07-28 10:38 ` Joonas Lahtinen
2016-07-28 11:36 ` Chris Wilson
2016-07-28 11:53 ` Joonas Lahtinen
2016-07-28 16:12 ` Chris Wilson
2016-07-29 9:10 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 16/22] drm/i915: Make fb_tracking.lock a spinlock Chris Wilson
2016-07-28 10:02 ` Daniel Vetter
2016-07-28 10:08 ` Daniel Vetter
2016-07-29 8:25 ` Chris Wilson
2016-07-28 10:19 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 17/22] drm/i915: Use atomics to manipulate obj->frontbuffer_bits Chris Wilson
2016-07-28 9:49 ` Joonas Lahtinen
2016-07-28 10:10 ` Chris Wilson
2016-07-28 10:51 ` Joonas Lahtinen
2016-07-28 10:05 ` Daniel Vetter [this message]
2016-07-27 11:14 ` [PATCH 18/22] drm/i915: Use dev_priv consistently through the intel_frontbuffer interface Chris Wilson
2016-07-28 9:36 ` Joonas Lahtinen
2016-07-28 10:06 ` Daniel Vetter
2016-07-27 11:14 ` [PATCH 19/22] drm/i915: Move obj->active:5 to obj->flags Chris Wilson
2016-07-29 7:40 ` Joonas Lahtinen
2016-07-29 8:04 ` Chris Wilson
2016-07-29 8:10 ` Chris Wilson
2016-07-29 9:34 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 20/22] drm/i915: Move i915_gem_object_wait_rendering() Chris Wilson
2016-07-28 9:37 ` Joonas Lahtinen
2016-07-27 11:14 ` [PATCH 21/22] drm/i915: Enable lockless lookup of request tracking via RCU Chris Wilson
2016-07-28 10:23 ` Daniel Vetter
2016-07-28 20:49 ` Chris Wilson
2016-07-29 8:41 ` Daniel Vetter
2016-07-29 8:49 ` Chris Wilson
2016-07-29 9:43 ` Chris Wilson
2016-07-29 9:45 ` Daniel Vetter
2016-07-27 11:15 ` [PATCH 22/22] drm/i915: Export our request as a dma-buf fence on the reservation object Chris Wilson
2016-07-28 10:32 ` Daniel Vetter
2016-07-28 10:40 ` Chris Wilson
2016-07-28 11:59 ` Daniel Vetter
2016-07-28 12:17 ` Chris Wilson
2016-07-28 12:28 ` Daniel Vetter
2016-07-28 12:45 ` Chris Wilson
2016-07-28 20:14 ` Daniel Vetter
2016-07-28 21:08 ` Chris Wilson
2016-07-27 11:23 ` ✗ Ro.CI.BAT: failure for series starting with [01/22] drm/i915: Combine loops within i915_gem_evict_something Patchwork
2016-07-29 10:20 ` ✗ Ro.CI.BAT: failure for series starting with [01/22] drm/i915: Combine loops within i915_gem_evict_something (rev2) Patchwork
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20160728100503.GE6232@phenom.ffwll.local \
--to=daniel@ffwll.ch \
--cc=chris@chris-wilson.co.uk \
--cc=daniel.vetter@ffwll.ch \
--cc=intel-gfx@lists.freedesktop.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox