drm/i915: Prevent leaking of -EIO from i915_wait_request()

author Chris Wilson <chris@chris-wilson.co.uk>

Wed, 13 Apr 2016 16:35:08 +0000 (17:35 +0100)

committer Chris Wilson <chris@chris-wilson.co.uk>

Thu, 14 Apr 2016 09:45:40 +0000 (10:45 +0100)
author Chris Wilson <chris@chris-wilson.co.uk>
Wed, 13 Apr 2016 16:35:08 +0000 (17:35 +0100)
committer Chris Wilson <chris@chris-wilson.co.uk>
Thu, 14 Apr 2016 09:45:40 +0000 (10:45 +0100)
diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h

index 54648e03db8c6cf07f2b0bab927b644386ad1359..0faca3a29868f60a5c2b253baf8eae47910a1290 100644 (file)
--- a/drivers/gpu/drm/i915/i915_drv.h
+++ b/drivers/gpu/drm/i915/i915_drv.h
@@ -3088,8 +3088,6 @@ i915_gem_find_active_request(struct intel_engine_cs *engine);
  
  bool i915_gem_retire_requests(struct drm_device *dev);
  void i915_gem_retire_requests_ring(struct intel_engine_cs *engine);
-int __must_check i915_gem_check_wedge(struct i915_gpu_error *error,
-                                     bool interruptible);
  
  static inline u32 i915_reset_counter(struct i915_gpu_error *error)
  {
diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c

index a62a5ec3679a9bda622a1923ee5a40aabfb8109f..0c57b20532be6bfec39ed7b25db4618ffef53c8d 100644 (file)
--- a/drivers/gpu/drm/i915/i915_gem.c
+++ b/drivers/gpu/drm/i915/i915_gem.c
@@ -206,11 +206,10 @@ i915_gem_object_put_pages_phys(struct drm_i915_gem_object *obj)
         BUG_ON(obj->madv == __I915_MADV_PURGED);
  
         ret = i915_gem_object_set_to_cpu_domain(obj, true);
-       if (ret) {
+       if (WARN_ON(ret)) {
                 /* In the event of a disaster, abandon all caches and
                  * hope for the best.
                  */
-               WARN_ON(ret != -EIO);
                 obj->base.read_domains = obj->base.write_domain = I915_GEM_DOMAIN_CPU;
         }
  
@@ -1105,15 +1104,13 @@ i915_gem_pwrite_ioctl(struct drm_device *dev, void *data,
         return ret;
  }
  
-int
-i915_gem_check_wedge(struct i915_gpu_error *error,
-                    bool interruptible)
+static int
+i915_gem_check_wedge(unsigned reset_counter, bool interruptible)
  {
-       if (i915_reset_in_progress_or_wedged(error)) {
-               /* Recovery complete, but the reset failed ... */
-               if (i915_terminally_wedged(error))
-                       return -EIO;
+       if (__i915_terminally_wedged(reset_counter))
+               return -EIO;
  
+       if (__i915_reset_in_progress(reset_counter)) {
                 /* Non-interruptible callers can't handle -EAGAIN, hence return
                  * -EIO unconditionally for these. */
                 if (!interruptible)
@@ -1287,13 +1284,14 @@ int __i915_wait_request(struct drm_i915_gem_request *req,
                 prepare_to_wait(&engine->irq_queue, &wait, state);
  
                 /* We need to check whether any gpu reset happened in between
-                * the caller grabbing the seqno and now ... */
+                * the request being submitted and now. If a reset has occurred,
+                * the request is effectively complete (we either are in the
+                * process of or have discarded the rendering and completely
+                * reset the GPU. The results of the request are lost and we
+                * are free to continue on with the original operation.
+                */
                 if (req->reset_counter != i915_reset_counter(&dev_priv->gpu_error)) {
-                       /* ... but upgrade the -EAGAIN to an -EIO if the gpu
-                        * is truely gone. */
-                       ret = i915_gem_check_wedge(&dev_priv->gpu_error, interruptible);
-                       if (ret == 0)
-                               ret = -EAGAIN;
+                       ret = 0;
                         break;
                 }
  
@@ -2154,11 +2152,10 @@ i915_gem_object_put_pages_gtt(struct drm_i915_gem_object *obj)
         BUG_ON(obj->madv == __I915_MADV_PURGED);
  
         ret = i915_gem_object_set_to_cpu_domain(obj, true);
-       if (ret) {
+       if (WARN_ON(ret)) {
                 /* In the event of a disaster, abandon all caches and
                  * hope for the best.
                  */
-               WARN_ON(ret != -EIO);
                 i915_gem_clflush_object(obj, true);
                 obj->base.read_domains = obj->base.write_domain = I915_GEM_DOMAIN_CPU;
         }
@@ -2729,8 +2726,11 @@ __i915_gem_request_alloc(struct intel_engine_cs *engine,
  
         *req_out = NULL;
  
-       ret = i915_gem_check_wedge(&dev_priv->gpu_error,
-                                  dev_priv->mm.interruptible);
+       /* ABI: Before userspace accesses the GPU (e.g. execbuffer), report
+        * EIO if the GPU is already wedged, or EAGAIN to drop the struct_mutex
+        * and restart.
+        */
+       ret = i915_gem_check_wedge(reset_counter, dev_priv->mm.interruptible);
         if (ret)
                 return ret;
  
@@ -4165,9 +4165,9 @@ i915_gem_ring_throttle(struct drm_device *dev, struct drm_file *file)
         if (ret)
                 return ret;
  
-       ret = i915_gem_check_wedge(&dev_priv->gpu_error, false);
-       if (ret)
-               return ret;
+       /* ABI: return -EIO if already wedged */
+       if (i915_terminally_wedged(&dev_priv->gpu_error))
+               return -EIO;
  
         spin_lock(&file_priv->mm.lock);
         list_for_each_entry(request, &file_priv->mm.request_list, client_list) {
diff --git a/drivers/gpu/drm/i915/i915_gem_userptr.c b/drivers/gpu/drm/i915/i915_gem_userptr.c

index e6b5938ce6e244064cf2c7a824b4403d8b073e32..32d9726e38b11878915ceef5c9f556fac1910459 100644 (file)
--- a/drivers/gpu/drm/i915/i915_gem_userptr.c
+++ b/drivers/gpu/drm/i915/i915_gem_userptr.c
@@ -112,10 +112,8 @@ static void cancel_userptr(struct work_struct *work)
                 was_interruptible = dev_priv->mm.interruptible;
                 dev_priv->mm.interruptible = false;
  
-               list_for_each_entry_safe(vma, tmp, &obj->vma_list, obj_link) {
-                       int ret = i915_vma_unbind(vma);
-                       WARN_ON(ret && ret != -EIO);
-               }
+               list_for_each_entry_safe(vma, tmp, &obj->vma_list, obj_link)
+                       WARN_ON(i915_vma_unbind(vma));
                 WARN_ON(i915_gem_object_put_pages(obj));
  
                 dev_priv->mm.interruptible = was_interruptible;
diff --git a/drivers/gpu/drm/i915/intel_display.c b/drivers/gpu/drm/i915/intel_display.c

index 6500f77fc78ecaf985d96b3a85b8341436b66da8..b1b457864e17c92acd84bfbef0a51065db600e7e 100644 (file)
--- a/drivers/gpu/drm/i915/intel_display.c
+++ b/drivers/gpu/drm/i915/intel_display.c
@@ -13436,11 +13436,9 @@ static int intel_atomic_prepare_commit(struct drm_device *dev,
  
                         ret = __i915_wait_request(intel_plane_state->wait_req,
                                                   true, NULL, NULL);
-
-                       /* Swallow -EIO errors to allow updates during hw lockup. */
-                       if (ret == -EIO)
-                               ret = 0;
                         if (ret) {
+                               /* Any hang should be swallowed by the wait */
+                               WARN_ON(ret == -EIO);
                                 mutex_lock(&dev->struct_mutex);
                                 drm_atomic_helper_cleanup_planes(dev, state);
                                 mutex_unlock(&dev->struct_mutex);
@@ -13792,10 +13790,11 @@ intel_prepare_plane_fb(struct drm_plane *plane,
                  */
                 if (needs_modeset(crtc_state))
                         ret = i915_gem_object_wait_rendering(old_obj, true);
-
-               /* Swallow -EIO errors to allow updates during hw lockup. */
-               if (ret && ret != -EIO)
+               if (ret) {
+                       /* GPU hangs should have been swallowed by the wait */
+                       WARN_ON(ret == -EIO);
                         return ret;
+               }
         }
  
         /* For framebuffer backed by dmabuf, wait for fence */
diff --git a/drivers/gpu/drm/i915/intel_lrc.c b/drivers/gpu/drm/i915/intel_lrc.c

index 6b0915eefe33a8397d1342874638dc45f01e0dc8..c5dba687f288341977e85bf90577d7a5f45b75e2 100644 (file)
--- a/drivers/gpu/drm/i915/intel_lrc.c
+++ b/drivers/gpu/drm/i915/intel_lrc.c
@@ -1048,7 +1048,7 @@ void intel_logical_ring_stop(struct intel_engine_cs *engine)
                 return;
  
         ret = intel_engine_idle(engine);
-       if (ret && !i915_reset_in_progress_or_wedged(&dev_priv->gpu_error))
+       if (ret)
                 DRM_ERROR("failed to quiesce %s whilst cleaning up: %d\n",
                           engine->name, ret);
  
diff --git a/drivers/gpu/drm/i915/intel_ringbuffer.c b/drivers/gpu/drm/i915/intel_ringbuffer.c

index d9d4a6a41a74900c6cecabc88298a7967ebde624..0b89cf82ba4d4ae7e679e693c7e892f09b79bfd8 100644 (file)
--- a/drivers/gpu/drm/i915/intel_ringbuffer.c
+++ b/drivers/gpu/drm/i915/intel_ringbuffer.c
@@ -3184,8 +3184,7 @@ intel_stop_engine(struct intel_engine_cs *engine)
                 return;
  
         ret = intel_engine_idle(engine);
-       if (ret &&
-           !i915_reset_in_progress_or_wedged(&to_i915(engine->dev)->gpu_error))
+       if (ret)
                 DRM_ERROR("failed to quiesce %s whilst cleaning up: %d\n",
                           engine->name, ret);
author	Chris Wilson <chris@chris-wilson.co.uk>
	Wed, 13 Apr 2016 16:35:08 +0000 (17:35 +0100)
committer	Chris Wilson <chris@chris-wilson.co.uk>
	Thu, 14 Apr 2016 09:45:40 +0000 (10:45 +0100)
drivers/gpu/drm/i915/i915_drv.h		patch \| blob \| history
drivers/gpu/drm/i915/i915_gem.c		patch \| blob \| history
drivers/gpu/drm/i915/i915_gem_userptr.c		patch \| blob \| history
drivers/gpu/drm/i915/intel_display.c		patch \| blob \| history
drivers/gpu/drm/i915/intel_lrc.c		patch \| blob \| history
drivers/gpu/drm/i915/intel_ringbuffer.c		patch \| blob \| history