drm/i915/gt: Close race between engine_park and intel_gt_retire_requests

author Chris Wilson <chris@chris-wilson.co.uk>

Wed, 20 Nov 2019 16:55:13 +0000 (16:55 +0000)

committer Chris Wilson <chris@chris-wilson.co.uk>

Wed, 20 Nov 2019 16:57:33 +0000 (16:57 +0000)
author Chris Wilson <chris@chris-wilson.co.uk>
Wed, 20 Nov 2019 16:55:13 +0000 (16:55 +0000)
committer Chris Wilson <chris@chris-wilson.co.uk>
Wed, 20 Nov 2019 16:57:33 +0000 (16:57 +0000)
diff --git a/drivers/gpu/drm/i915/gt/intel_gt_requests.c b/drivers/gpu/drm/i915/gt/intel_gt_requests.c

index 25291e2af21e4c139018e4386a635a3ed41a82f6..1a005da8c5881b7ff74f46ad57de58cc8c8003d2 100644 (file)
--- a/drivers/gpu/drm/i915/gt/intel_gt_requests.c
+++ b/drivers/gpu/drm/i915/gt/intel_gt_requests.c
@@ -49,8 +49,8 @@ long intel_gt_retire_requests_timeout(struct intel_gt *gt, long timeout)
                         continue;
  
                 intel_timeline_get(tl);
-               GEM_BUG_ON(!tl->active_count);
-               tl->active_count++; /* pin the list element */
+               GEM_BUG_ON(!atomic_read(&tl->active_count));
+               atomic_inc(&tl->active_count); /* pin the list element */
                 spin_unlock_irqrestore(&timelines->lock, flags);
  
                 if (timeout > 0) {
@@ -71,14 +71,14 @@ long intel_gt_retire_requests_timeout(struct intel_gt *gt, long timeout)
  
                 /* Resume iteration after dropping lock */
                 list_safe_reset_next(tl, tn, link);
-               if (!--tl->active_count)
+               if (atomic_dec_and_test(&tl->active_count))
                         list_del(&tl->link);
  
                 mutex_unlock(&tl->mutex);
  
                 /* Defer the final release to after the spinlock */
                 if (refcount_dec_and_test(&tl->kref.refcount)) {
-                       GEM_BUG_ON(tl->active_count);
+                       GEM_BUG_ON(atomic_read(&tl->active_count));
                         list_add(&tl->link, &free);
                 }
         }
diff --git a/drivers/gpu/drm/i915/gt/intel_timeline.c b/drivers/gpu/drm/i915/gt/intel_timeline.c

index 0e277835aad05f4fc7e0f828e9c81e069a84a33b..b35f12729983b0ff8a754296c78f98c502f5fc8c 100644 (file)
--- a/drivers/gpu/drm/i915/gt/intel_timeline.c
+++ b/drivers/gpu/drm/i915/gt/intel_timeline.c
@@ -334,15 +334,33 @@ void intel_timeline_enter(struct intel_timeline *tl)
         struct intel_gt_timelines *timelines = &tl->gt->timelines;
         unsigned long flags;
  
+       /*
+        * Pretend we are serialised by the timeline->mutex.
+        *
+        * While generally true, there are a few exceptions to the rule
+        * for the engine->kernel_context being used to manage power
+        * transitions. As the engine_park may be called from under any
+        * timeline, it uses the power mutex as a global serialisation
+        * lock to prevent any other request entering its timeline.
+        *
+        * The rule is generally tl->mutex, otherwise engine->wakeref.mutex.
+        *
+        * However, intel_gt_retire_requests() does not know which engine
+        * it is retiring along and so cannot partake in the engine-pm
+        * barrier, and there we use the tl->active_count as a means to
+        * pin the timeline in the active_list while the locks are dropped.
+        * Ergo, as that is outside of the engine-pm barrier, we need to
+        * use atomic operations to manipulate tl->active_count.
+        */
         lockdep_assert_held(&tl->mutex);
-
         GEM_BUG_ON(!atomic_read(&tl->pin_count));
-       if (tl->active_count++)
+
+       if (atomic_add_unless(&tl->active_count, 1, 0))
                 return;
-       GEM_BUG_ON(!tl->active_count); /* overflow? */
  
         spin_lock_irqsave(&timelines->lock, flags);
-       list_add_tail(&tl->link, &timelines->active_list);
+       if (!atomic_fetch_inc(&tl->active_count))
+               list_add_tail(&tl->link, &timelines->active_list);
         spin_unlock_irqrestore(&timelines->lock, flags);
  }
  
@@ -351,14 +369,16 @@ void intel_timeline_exit(struct intel_timeline *tl)
         struct intel_gt_timelines *timelines = &tl->gt->timelines;
         unsigned long flags;
  
+       /* See intel_timeline_enter() */
         lockdep_assert_held(&tl->mutex);
  
-       GEM_BUG_ON(!tl->active_count);
-       if (--tl->active_count)
+       GEM_BUG_ON(!atomic_read(&tl->active_count));
+       if (atomic_add_unless(&tl->active_count, -1, 1))
                 return;
  
         spin_lock_irqsave(&timelines->lock, flags);
-       list_del(&tl->link);
+       if (atomic_dec_and_test(&tl->active_count))
+               list_del(&tl->link);
         spin_unlock_irqrestore(&timelines->lock, flags);
  
         /*
diff --git a/drivers/gpu/drm/i915/gt/intel_timeline_types.h b/drivers/gpu/drm/i915/gt/intel_timeline_types.h

index 98d9ee166379518f6bceb8619241d22f5bb7a856..5244615ed1cb4a13b5a81737bcd67e75e7472b09 100644 (file)
--- a/drivers/gpu/drm/i915/gt/intel_timeline_types.h
+++ b/drivers/gpu/drm/i915/gt/intel_timeline_types.h
@@ -42,7 +42,7 @@ struct intel_timeline {
          * from the intel_context caller plus internal atomicity.
          */
         atomic_t pin_count;
-       unsigned int active_count;
+       atomic_t active_count;
  
         const u32 *hwsp_seqno;
         struct i915_vma *hwsp_ggtt;
author	Chris Wilson <chris@chris-wilson.co.uk>
	Wed, 20 Nov 2019 16:55:13 +0000 (16:55 +0000)
committer	Chris Wilson <chris@chris-wilson.co.uk>
	Wed, 20 Nov 2019 16:57:33 +0000 (16:57 +0000)
drivers/gpu/drm/i915/gt/intel_gt_requests.c		patch \| blob \| history
drivers/gpu/drm/i915/gt/intel_timeline.c		patch \| blob \| history
drivers/gpu/drm/i915/gt/intel_timeline_types.h		patch \| blob \| history