Commit ea4ebde0 authored by Chris Mason

Btrfs: fix deadlocks with trylock on tree nodes

The Btrfs tree trylock function is poorly named.  It always takes
the spinlock and backs off if the blocking lock is held.  This
can lead to surprising lockups because people expect it to really be a
trylock.

This commit makes it a pure trylock, both for the spinlock and the
blocking lock.  It also reworks the nested lock handling slightly to
avoid taking the read lock while a spinning write lock might be held.
Signed-off-by: Chris Mason <clm@fb.com>
parent 47a306a7
...@@ -33,14 +33,14 @@ static void btrfs_assert_tree_read_locked(struct extent_buffer *eb); ...@@ -33,14 +33,14 @@ static void btrfs_assert_tree_read_locked(struct extent_buffer *eb);
*/ */
void btrfs_set_lock_blocking_rw(struct extent_buffer *eb, int rw) void btrfs_set_lock_blocking_rw(struct extent_buffer *eb, int rw)
{ {
if (eb->lock_nested) { /*
read_lock(&eb->lock); * no lock is required. The lock owner may change if
if (eb->lock_nested && current->pid == eb->lock_owner) { * we have a read lock, but it won't change to or away
read_unlock(&eb->lock); * from us. If we have the write lock, we are the owner
return; * and it'll never change.
} */
read_unlock(&eb->lock); if (eb->lock_nested && current->pid == eb->lock_owner)
} return;
if (rw == BTRFS_WRITE_LOCK) { if (rw == BTRFS_WRITE_LOCK) {
if (atomic_read(&eb->blocking_writers) == 0) { if (atomic_read(&eb->blocking_writers) == 0) {
WARN_ON(atomic_read(&eb->spinning_writers) != 1); WARN_ON(atomic_read(&eb->spinning_writers) != 1);
...@@ -65,14 +65,15 @@ void btrfs_set_lock_blocking_rw(struct extent_buffer *eb, int rw) ...@@ -65,14 +65,15 @@ void btrfs_set_lock_blocking_rw(struct extent_buffer *eb, int rw)
*/ */
void btrfs_clear_lock_blocking_rw(struct extent_buffer *eb, int rw) void btrfs_clear_lock_blocking_rw(struct extent_buffer *eb, int rw)
{ {
if (eb->lock_nested) { /*
read_lock(&eb->lock); * no lock is required. The lock owner may change if
if (eb->lock_nested && current->pid == eb->lock_owner) { * we have a read lock, but it won't change to or away
read_unlock(&eb->lock); * from us. If we have the write lock, we are the owner
return; * and it'll never change.
} */
read_unlock(&eb->lock); if (eb->lock_nested && current->pid == eb->lock_owner)
} return;
if (rw == BTRFS_WRITE_LOCK_BLOCKING) { if (rw == BTRFS_WRITE_LOCK_BLOCKING) {
BUG_ON(atomic_read(&eb->blocking_writers) != 1); BUG_ON(atomic_read(&eb->blocking_writers) != 1);
write_lock(&eb->lock); write_lock(&eb->lock);
...@@ -99,6 +100,9 @@ void btrfs_clear_lock_blocking_rw(struct extent_buffer *eb, int rw) ...@@ -99,6 +100,9 @@ void btrfs_clear_lock_blocking_rw(struct extent_buffer *eb, int rw)
void btrfs_tree_read_lock(struct extent_buffer *eb) void btrfs_tree_read_lock(struct extent_buffer *eb)
{ {
again: again:
BUG_ON(!atomic_read(&eb->blocking_writers) &&
current->pid == eb->lock_owner);
read_lock(&eb->lock); read_lock(&eb->lock);
if (atomic_read(&eb->blocking_writers) && if (atomic_read(&eb->blocking_writers) &&
current->pid == eb->lock_owner) { current->pid == eb->lock_owner) {
...@@ -132,7 +136,9 @@ int btrfs_try_tree_read_lock(struct extent_buffer *eb) ...@@ -132,7 +136,9 @@ int btrfs_try_tree_read_lock(struct extent_buffer *eb)
if (atomic_read(&eb->blocking_writers)) if (atomic_read(&eb->blocking_writers))
return 0; return 0;
read_lock(&eb->lock); if (!read_trylock(&eb->lock))
return 0;
if (atomic_read(&eb->blocking_writers)) { if (atomic_read(&eb->blocking_writers)) {
read_unlock(&eb->lock); read_unlock(&eb->lock);
return 0; return 0;
...@@ -151,7 +157,10 @@ int btrfs_try_tree_write_lock(struct extent_buffer *eb) ...@@ -151,7 +157,10 @@ int btrfs_try_tree_write_lock(struct extent_buffer *eb)
if (atomic_read(&eb->blocking_writers) || if (atomic_read(&eb->blocking_writers) ||
atomic_read(&eb->blocking_readers)) atomic_read(&eb->blocking_readers))
return 0; return 0;
write_lock(&eb->lock);
if (!write_trylock(&eb->lock))
return 0;
if (atomic_read(&eb->blocking_writers) || if (atomic_read(&eb->blocking_writers) ||
atomic_read(&eb->blocking_readers)) { atomic_read(&eb->blocking_readers)) {
write_unlock(&eb->lock); write_unlock(&eb->lock);
...@@ -168,14 +177,15 @@ int btrfs_try_tree_write_lock(struct extent_buffer *eb) ...@@ -168,14 +177,15 @@ int btrfs_try_tree_write_lock(struct extent_buffer *eb)
*/ */
void btrfs_tree_read_unlock(struct extent_buffer *eb) void btrfs_tree_read_unlock(struct extent_buffer *eb)
{ {
if (eb->lock_nested) { /*
read_lock(&eb->lock); * if we're nested, we have the write lock. No new locking
if (eb->lock_nested && current->pid == eb->lock_owner) { * is needed as long as we are the lock owner.
eb->lock_nested = 0; * The write unlock will do a barrier for us, and the lock_nested
read_unlock(&eb->lock); * field only matters to the lock owner.
return; */
} if (eb->lock_nested && current->pid == eb->lock_owner) {
read_unlock(&eb->lock); eb->lock_nested = 0;
return;
} }
btrfs_assert_tree_read_locked(eb); btrfs_assert_tree_read_locked(eb);
WARN_ON(atomic_read(&eb->spinning_readers) == 0); WARN_ON(atomic_read(&eb->spinning_readers) == 0);
...@@ -189,14 +199,15 @@ void btrfs_tree_read_unlock(struct extent_buffer *eb) ...@@ -189,14 +199,15 @@ void btrfs_tree_read_unlock(struct extent_buffer *eb)
*/ */
void btrfs_tree_read_unlock_blocking(struct extent_buffer *eb) void btrfs_tree_read_unlock_blocking(struct extent_buffer *eb)
{ {
if (eb->lock_nested) { /*
read_lock(&eb->lock); * if we're nested, we have the write lock. No new locking
if (eb->lock_nested && current->pid == eb->lock_owner) { * is needed as long as we are the lock owner.
eb->lock_nested = 0; * The write unlock will do a barrier for us, and the lock_nested
read_unlock(&eb->lock); * field only matters to the lock owner.
return; */
} if (eb->lock_nested && current->pid == eb->lock_owner) {
read_unlock(&eb->lock); eb->lock_nested = 0;
return;
} }
btrfs_assert_tree_read_locked(eb); btrfs_assert_tree_read_locked(eb);
WARN_ON(atomic_read(&eb->blocking_readers) == 0); WARN_ON(atomic_read(&eb->blocking_readers) == 0);
...@@ -244,6 +255,7 @@ void btrfs_tree_unlock(struct extent_buffer *eb) ...@@ -244,6 +255,7 @@ void btrfs_tree_unlock(struct extent_buffer *eb)
BUG_ON(blockers > 1); BUG_ON(blockers > 1);
btrfs_assert_tree_locked(eb); btrfs_assert_tree_locked(eb);
eb->lock_owner = 0;
atomic_dec(&eb->write_locks); atomic_dec(&eb->write_locks);
if (blockers) { if (blockers) {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment