Commit 3e9fd94f authored by Chris Mason's avatar Chris Mason

Btrfs: Avoid fragmentation from parallel delalloc filling

Signed-off-by: default avatarChris Mason <chris.mason@oracle.com>
parent 2f4cbe64
...@@ -1033,11 +1033,11 @@ int find_first_extent_bit(struct extent_map_tree *tree, u64 start, ...@@ -1033,11 +1033,11 @@ int find_first_extent_bit(struct extent_map_tree *tree, u64 start,
EXPORT_SYMBOL(find_first_extent_bit); EXPORT_SYMBOL(find_first_extent_bit);
u64 find_lock_delalloc_range(struct extent_map_tree *tree, u64 find_lock_delalloc_range(struct extent_map_tree *tree,
u64 start, u64 lock_start, u64 *end, u64 max_bytes) u64 *start, u64 *end, u64 max_bytes)
{ {
struct rb_node *node; struct rb_node *node;
struct extent_state *state; struct extent_state *state;
u64 cur_start = start; u64 cur_start = *start;
u64 found = 0; u64 found = 0;
u64 total_bytes = 0; u64 total_bytes = 0;
...@@ -1054,27 +1054,43 @@ u64 find_lock_delalloc_range(struct extent_map_tree *tree, ...@@ -1054,27 +1054,43 @@ u64 find_lock_delalloc_range(struct extent_map_tree *tree,
while(1) { while(1) {
state = rb_entry(node, struct extent_state, rb_node); state = rb_entry(node, struct extent_state, rb_node);
if (state->start != cur_start) { if (found && state->start != cur_start) {
goto out; goto out;
} }
if (!(state->state & EXTENT_DELALLOC)) { if (!(state->state & EXTENT_DELALLOC)) {
goto out; goto out;
} }
if (state->start >= lock_start) { if (!found) {
if (state->state & EXTENT_LOCKED) { struct extent_state *prev_state;
DEFINE_WAIT(wait); struct rb_node *prev_node = node;
atomic_inc(&state->refs); while(1) {
prepare_to_wait(&state->wq, &wait, prev_node = rb_prev(prev_node);
TASK_UNINTERRUPTIBLE); if (!prev_node)
write_unlock_irq(&tree->lock); break;
schedule(); prev_state = rb_entry(prev_node,
write_lock_irq(&tree->lock); struct extent_state,
finish_wait(&state->wq, &wait); rb_node);
free_extent_state(state); if (!(prev_state->state & EXTENT_DELALLOC))
goto search_again; break;
state = prev_state;
node = prev_node;
} }
state->state |= EXTENT_LOCKED;
} }
if (state->state & EXTENT_LOCKED) {
DEFINE_WAIT(wait);
atomic_inc(&state->refs);
prepare_to_wait(&state->wq, &wait,
TASK_UNINTERRUPTIBLE);
write_unlock_irq(&tree->lock);
schedule();
write_lock_irq(&tree->lock);
finish_wait(&state->wq, &wait);
free_extent_state(state);
goto search_again;
}
state->state |= EXTENT_LOCKED;
if (!found)
*start = state->start;
found++; found++;
*end = state->end; *end = state->end;
cur_start = state->end + 1; cur_start = state->end + 1;
...@@ -1695,6 +1711,7 @@ static int __extent_writepage(struct page *page, struct writeback_control *wbc, ...@@ -1695,6 +1711,7 @@ static int __extent_writepage(struct page *page, struct writeback_control *wbc,
struct extent_page_data *epd = data; struct extent_page_data *epd = data;
struct extent_map_tree *tree = epd->tree; struct extent_map_tree *tree = epd->tree;
u64 start = (u64)page->index << PAGE_CACHE_SHIFT; u64 start = (u64)page->index << PAGE_CACHE_SHIFT;
u64 delalloc_start;
u64 page_end = start + PAGE_CACHE_SIZE - 1; u64 page_end = start + PAGE_CACHE_SIZE - 1;
u64 end; u64 end;
u64 cur = start; u64 cur = start;
...@@ -1729,25 +1746,23 @@ static int __extent_writepage(struct page *page, struct writeback_control *wbc, ...@@ -1729,25 +1746,23 @@ static int __extent_writepage(struct page *page, struct writeback_control *wbc,
set_page_extent_mapped(page); set_page_extent_mapped(page);
lock_extent(tree, start, page_end, GFP_NOFS); delalloc_start = start;
nr_delalloc = find_lock_delalloc_range(tree, start, page_end + 1, delalloc_end = 0;
&delalloc_end, while(delalloc_end < page_end) {
128 * 1024 * 1024); nr_delalloc = find_lock_delalloc_range(tree, &delalloc_start,
if (nr_delalloc) { &delalloc_end,
tree->ops->fill_delalloc(inode, start, delalloc_end); 128 * 1024 * 1024);
if (delalloc_end >= page_end + 1) { if (nr_delalloc <= 0)
clear_extent_bit(tree, page_end + 1, delalloc_end, break;
EXTENT_LOCKED | EXTENT_DELALLOC, tree->ops->fill_delalloc(inode, delalloc_start,
1, 0, GFP_NOFS); delalloc_end);
} clear_extent_bit(tree, delalloc_start,
clear_extent_bit(tree, start, page_end, EXTENT_DELALLOC, delalloc_end,
0, 0, GFP_NOFS); EXTENT_LOCKED | EXTENT_DELALLOC,
if (test_range_bit(tree, start, page_end, EXTENT_DELALLOC, 0)) { 1, 0, GFP_NOFS);
printk("found delalloc bits after clear extent_bit\n"); delalloc_start = delalloc_end + 1;
}
} else if (test_range_bit(tree, start, page_end, EXTENT_DELALLOC, 0)) {
printk("found delalloc bits after find_delalloc_range returns 0\n");
} }
lock_extent(tree, start, page_end, GFP_NOFS);
end = page_end; end = page_end;
if (test_range_bit(tree, start, page_end, EXTENT_DELALLOC, 0)) { if (test_range_bit(tree, start, page_end, EXTENT_DELALLOC, 0)) {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment