git.proxmox.com Git - mirror_ubuntu-focal-kernel.git/commitdiff
drm/i915/gt: Close race between engine_park and intel_gt_retire_requests
author     Chris Wilson <chris@chris-wilson.co.uk>
           Wed, 20 Nov 2019 16:55:13 +0000 (16:55 +0000)
committer  Andrea Righi <andrea.righi@canonical.com>
           Mon, 24 Feb 2020 20:35:40 +0000 (21:35 +0100)
BugLink: https://bugs.launchpad.net/bugs/1853044
The general concept was that intel_timeline.active_count was locked by
the intel_timeline.mutex. The exception was for power management, where
the engine->kernel_context->timeline could be manipulated under the
global wakeref.mutex.

This was quite solid, as we always manipulated the timeline only while
we held an engine wakeref.

And then we started retiring requests outside of struct_mutex, only
using the timelines.active_list and the timeline->mutex. There we
started manipulating intel_timeline.active_count outside of an engine
wakeref, and so introduced a race between __engine_park() and
intel_gt_retire_requests(), a race that could result in the
engine->kernel_context not being added to the active timelines and so
losing requests, which caused us to keep the system permanently powered
up [and unloadable].
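
To make the interleaving concrete, here is a minimal sketch of the hazard;
the helper names are hypothetical and this is not the driver code. With a
plain counter updated under two different locks, the park path can observe a
transient pin taken by the retirement path and skip its list_add(), after
which the retirement path drops that pin and deletes the list element,
leaving the kernel_context timeline (and its final request) off the
active_list:

  /* Hypothetical sketch of the race; not the i915 code. */
  struct tl {
          unsigned int active_count;      /* plain int, no single owner lock */
          struct list_head link;
  };

  /* Park path: intel_timeline_enter(), under engine->wakeref.mutex only. */
  static void sketch_enter(struct tl *tl, struct list_head *active_list)
  {
          if (tl->active_count++)         /* sees a transient retirement pin */
                  return;                 /* ... and never does the list_add() */
          list_add(&tl->link, active_list);
  }

  /* Retirement path: under tl->mutex + timelines->lock, no engine wakeref. */
  static void sketch_unpin(struct tl *tl)
  {
          if (!--tl->active_count)        /* pin dropped, count hits zero */
                  list_del(&tl->link);    /* timeline vanishes from active_list */
  }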

The race would be easy to close if we could take the engine wakeref for
the timeline before we retire -- except timelines are not bound to any
engine and so we would need to keep all active engines awake. The
alternative is to guard intel_timeline_enter/intel_timeline_exit for use
outside of the timeline->mutex.
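
In outline, the fix below turns active_count into an atomic_t and splits each
transition into a lockless fast path and a spinlock-guarded slow path; this is
a simplified rendering of the diff that follows, with the lockdep and
GEM_BUG_ON annotations trimmed:

  void intel_timeline_enter(struct intel_timeline *tl)
  {
          struct intel_gt_timelines *timelines = &tl->gt->timelines;
          unsigned long flags;

          /* Fast path: already active, just take another reference. */
          if (atomic_add_unless(&tl->active_count, 1, 0))
                  return;

          /* Possible 0 -> 1 transition: decide list_add under the lock. */
          spin_lock_irqsave(&timelines->lock, flags);
          if (!atomic_fetch_inc(&tl->active_count))
                  list_add_tail(&tl->link, &timelines->active_list);
          spin_unlock_irqrestore(&timelines->lock, flags);
  }

  void intel_timeline_exit(struct intel_timeline *tl)
  {
          struct intel_gt_timelines *timelines = &tl->gt->timelines;
          unsigned long flags;

          /* Fast path: not the last active reference. */
          if (atomic_add_unless(&tl->active_count, -1, 1))
                  return;

          /* Possible 1 -> 0 transition: decide list_del under the lock. */
          spin_lock_irqsave(&timelines->lock, flags);
          if (atomic_dec_and_test(&tl->active_count))
                  list_del(&tl->link);
          spin_unlock_irqrestore(&timelines->lock, flags);
  }

Any context that misses the fast path serialises on timelines->lock, so only
the thread that actually performs the 0 <-> 1 transition adds or removes the
list element, and list membership is never decided outside the spinlock.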

Fixes: e5dadff4b093 ("drm/i915: Protect request retirement with timeline->mutex")
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Matthew Auld <matthew.auld@intel.com>
Cc: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20191120165514.3955081-1-chris@chris-wilson.co.uk
(cherry picked from commit a6edbca74b305adc165e67065d7ee766006e6a48)
Signed-off-by: Joonas Lahtinen <joonas.lahtinen@linux.intel.com>
(cherry picked from commit ca1711d1991f968d1e88725a2e607e57ecd5c5f1)
Signed-off-by: Andrea Righi <andrea.righi@canonical.com>
drivers/gpu/drm/i915/gt/intel_timeline.c
drivers/gpu/drm/i915/gt/intel_timeline_types.h
drivers/gpu/drm/i915/i915_request.c

diff --git a/drivers/gpu/drm/i915/gt/intel_timeline.c b/drivers/gpu/drm/i915/gt/intel_timeline.c
index 9cb01d9828f1dbc189793c297b9cf42d7088bf00..898c51b346fc4efdc887696639a976f94f394b69 100644
@@ -339,15 +339,33 @@ void intel_timeline_enter(struct intel_timeline *tl)
        struct intel_gt_timelines *timelines = &tl->gt->timelines;
        unsigned long flags;
 
+       /*
+        * Pretend we are serialised by the timeline->mutex.
+        *
+        * While generally true, there are a few exceptions to the rule
+        * for the engine->kernel_context being used to manage power
+        * transitions. As the engine_park may be called from under any
+        * timeline, it uses the power mutex as a global serialisation
+        * lock to prevent any other request entering its timeline.
+        *
+        * The rule is generally tl->mutex, otherwise engine->wakeref.mutex.
+        *
+        * However, intel_gt_retire_requests() does not know which engine
+        * it is retiring along and so cannot partake in the engine-pm
+        * barrier, and there we use the tl->active_count as a means to
+        * pin the timeline in the active_list while the locks are dropped.
+        * Ergo, as that is outside of the engine-pm barrier, we need to
+        * use atomic to manipulate tl->active_count.
+        */
        lockdep_assert_held(&tl->mutex);
-
        GEM_BUG_ON(!atomic_read(&tl->pin_count));
-       if (tl->active_count++)
+
+       if (atomic_add_unless(&tl->active_count, 1, 0))
                return;
-       GEM_BUG_ON(!tl->active_count); /* overflow? */
 
        spin_lock_irqsave(&timelines->lock, flags);
-       list_add(&tl->link, &timelines->active_list);
+       if (!atomic_fetch_inc(&tl->active_count))
+               list_add_tail(&tl->link, &timelines->active_list);
        spin_unlock_irqrestore(&timelines->lock, flags);
 }
 
@@ -356,14 +374,16 @@ void intel_timeline_exit(struct intel_timeline *tl)
        struct intel_gt_timelines *timelines = &tl->gt->timelines;
        unsigned long flags;
 
+       /* See intel_timeline_enter() */
        lockdep_assert_held(&tl->mutex);
 
-       GEM_BUG_ON(!tl->active_count);
-       if (--tl->active_count)
+       GEM_BUG_ON(!atomic_read(&tl->active_count));
+       if (atomic_add_unless(&tl->active_count, -1, 1))
                return;
 
        spin_lock_irqsave(&timelines->lock, flags);
-       list_del(&tl->link);
+       if (atomic_dec_and_test(&tl->active_count))
+               list_del(&tl->link);
        spin_unlock_irqrestore(&timelines->lock, flags);
 
        /*
diff --git a/drivers/gpu/drm/i915/gt/intel_timeline_types.h b/drivers/gpu/drm/i915/gt/intel_timeline_types.h
index 2b1baf2fcc8e438351e4027b1aa19ea5b31b0ad8..fc80c40f9bc3364e2c79a39ec5904f24c9ba27ed 100644
@@ -42,7 +42,7 @@ struct intel_timeline {
         * from the intel_context caller plus internal atomicity.
         */
        atomic_t pin_count;
-       unsigned int active_count;
+       atomic_t active_count;
 
        const u32 *hwsp_seqno;
        struct i915_vma *hwsp_ggtt;
diff --git a/drivers/gpu/drm/i915/i915_request.c b/drivers/gpu/drm/i915/i915_request.c
index 1c5506822dc7296a9d247de9cbf0330a55f55cb2..2f4ac438b96c7fd3bf74a0203394a6dddd215726 100644
@@ -1513,8 +1513,8 @@ bool i915_retire_requests(struct drm_i915_private *i915)
                        continue;
 
                intel_timeline_get(tl);
-               GEM_BUG_ON(!tl->active_count);
-               tl->active_count++; /* pin the list element */
+               GEM_BUG_ON(!atomic_read(&tl->active_count));
+               atomic_inc(&tl->active_count); /* pin the list element */
                spin_unlock_irqrestore(&timelines->lock, flags);
 
                retire_requests(tl);
@@ -1523,14 +1523,14 @@ bool i915_retire_requests(struct drm_i915_private *i915)
 
                /* Resume iteration after dropping lock */
                list_safe_reset_next(tl, tn, link);
-               if (!--tl->active_count)
+               if (atomic_dec_and_test(&tl->active_count))
                        list_del(&tl->link);
 
                mutex_unlock(&tl->mutex);
 
                /* Defer the final release to after the spinlock */
                if (refcount_dec_and_test(&tl->kref.refcount)) {
-                       GEM_BUG_ON(tl->active_count);
+                       GEM_BUG_ON(atomic_read(&tl->active_count));
                        list_add(&tl->link, &free);
                }
        }