Commit 9700a1df authored by Matthew Auld's avatar Matthew Auld Committed by Rodrigo Vivi

drm/xe: add lockdep annotation for xe_device_mem_access_put()

The main motivation is with d3cold which will make the suspend and
resume callbacks even more scary, but is useful regardless. We already
have the needed annotation on the acquire side with
xe_device_mem_access_get(), and by adding the annotation on the release
side we should have a lot more confidence that our locking hierarchy is
correct.

v2:
  - Move the annotation into both callbacks for better symmetry. Also
    don't hold over the entire mem_access_get(); we only need to lockep
    to understand what is being held upon entering mem_access_get(), and
    how that matches up with locks in the callbacks.
Signed-off-by: default avatarMatthew Auld <matthew.auld@intel.com>
Cc: Thomas Hellström <thomas.hellstrom@linux.intel.com>
Cc: Anshuman Gupta <anshuman.gupta@intel.com>
Cc: Rodrigo Vivi <rodrigo.vivi@intel.com>
Reviewed-by: default avatarRodrigo Vivi <rodrigo.vivi@intel.com>
Signed-off-by: default avatarRodrigo Vivi <rodrigo.vivi@intel.com>
parent 7ead3315
...@@ -35,7 +35,7 @@ ...@@ -35,7 +35,7 @@
#include "xe_wait_user_fence.h" #include "xe_wait_user_fence.h"
#ifdef CONFIG_LOCKDEP #ifdef CONFIG_LOCKDEP
static struct lockdep_map xe_device_mem_access_lockdep_map = { struct lockdep_map xe_device_mem_access_lockdep_map = {
.name = "xe_device_mem_access_lockdep_map" .name = "xe_device_mem_access_lockdep_map"
}; };
#endif #endif
...@@ -431,13 +431,13 @@ void xe_device_mem_access_get(struct xe_device *xe) ...@@ -431,13 +431,13 @@ void xe_device_mem_access_get(struct xe_device *xe)
* runtime_resume callback, lockdep should give us a nice splat. * runtime_resume callback, lockdep should give us a nice splat.
*/ */
lock_map_acquire(&xe_device_mem_access_lockdep_map); lock_map_acquire(&xe_device_mem_access_lockdep_map);
lock_map_release(&xe_device_mem_access_lockdep_map);
xe_pm_runtime_get(xe); xe_pm_runtime_get(xe);
ref = atomic_inc_return(&xe->mem_access.ref); ref = atomic_inc_return(&xe->mem_access.ref);
XE_WARN_ON(ref == S32_MAX); XE_WARN_ON(ref == S32_MAX);
lock_map_release(&xe_device_mem_access_lockdep_map);
} }
void xe_device_mem_access_put(struct xe_device *xe) void xe_device_mem_access_put(struct xe_device *xe)
......
...@@ -16,6 +16,10 @@ struct xe_file; ...@@ -16,6 +16,10 @@ struct xe_file;
#include "xe_force_wake.h" #include "xe_force_wake.h"
#include "xe_macros.h" #include "xe_macros.h"
#ifdef CONFIG_LOCKDEP
extern struct lockdep_map xe_device_mem_access_lockdep_map;
#endif
static inline struct xe_device *to_xe_device(const struct drm_device *dev) static inline struct xe_device *to_xe_device(const struct drm_device *dev)
{ {
return container_of(dev, struct xe_device, drm); return container_of(dev, struct xe_device, drm);
......
...@@ -188,6 +188,29 @@ int xe_pm_runtime_suspend(struct xe_device *xe) ...@@ -188,6 +188,29 @@ int xe_pm_runtime_suspend(struct xe_device *xe)
/* Disable access_ongoing asserts and prevent recursive pm calls */ /* Disable access_ongoing asserts and prevent recursive pm calls */
xe_pm_write_callback_task(xe, current); xe_pm_write_callback_task(xe, current);
/*
* The actual xe_device_mem_access_put() is always async underneath, so
* exactly where that is called should makes no difference to us. However
* we still need to be very careful with the locks that this callback
* acquires and the locks that are acquired and held by any callers of
* xe_device_mem_access_get(). We already have the matching annotation
* on that side, but we also need it here. For example lockdep should be
* able to tell us if the following scenario is in theory possible:
*
* CPU0 | CPU1 (kworker)
* lock(A) |
* | xe_pm_runtime_suspend()
* | lock(A)
* xe_device_mem_access_get() |
*
* This will clearly deadlock since rpm core needs to wait for
* xe_pm_runtime_suspend() to complete, but here we are holding lock(A)
* on CPU0 which prevents CPU1 making forward progress. With the
* annotation here and in xe_device_mem_access_get() lockdep will see
* the potential lock inversion and give us a nice splat.
*/
lock_map_acquire(&xe_device_mem_access_lockdep_map);
if (xe->d3cold.allowed) { if (xe->d3cold.allowed) {
err = xe_bo_evict_all(xe); err = xe_bo_evict_all(xe);
if (err) if (err)
...@@ -202,6 +225,7 @@ int xe_pm_runtime_suspend(struct xe_device *xe) ...@@ -202,6 +225,7 @@ int xe_pm_runtime_suspend(struct xe_device *xe)
xe_irq_suspend(xe); xe_irq_suspend(xe);
out: out:
lock_map_release(&xe_device_mem_access_lockdep_map);
xe_pm_write_callback_task(xe, NULL); xe_pm_write_callback_task(xe, NULL);
return err; return err;
} }
...@@ -215,6 +239,8 @@ int xe_pm_runtime_resume(struct xe_device *xe) ...@@ -215,6 +239,8 @@ int xe_pm_runtime_resume(struct xe_device *xe)
/* Disable access_ongoing asserts and prevent recursive pm calls */ /* Disable access_ongoing asserts and prevent recursive pm calls */
xe_pm_write_callback_task(xe, current); xe_pm_write_callback_task(xe, current);
lock_map_acquire(&xe_device_mem_access_lockdep_map);
/* /*
* It can be possible that xe has allowed d3cold but other pcie devices * It can be possible that xe has allowed d3cold but other pcie devices
* in gfx card soc would have blocked d3cold, therefore card has not * in gfx card soc would have blocked d3cold, therefore card has not
...@@ -250,6 +276,7 @@ int xe_pm_runtime_resume(struct xe_device *xe) ...@@ -250,6 +276,7 @@ int xe_pm_runtime_resume(struct xe_device *xe)
goto out; goto out;
} }
out: out:
lock_map_release(&xe_device_mem_access_lockdep_map);
xe_pm_write_callback_task(xe, NULL); xe_pm_write_callback_task(xe, NULL);
return err; return err;
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment