Commit a7ccb255, authored by Dennis Zhou, committed by David Sterba

btrfs: keep track of which extents have been discarded

Async discard will use the free space cache as backing knowledge for
which extents to discard. This patch plumbs knowledge about which
extents need to be discarded into the free space cache from
unpin_extent_range().

An untrimmed extent can merge with everything as this is a new region.
Absorbing trimmed extents is a tradeoff for greater coalescing, which
makes life better for find_free_extent(). Additionally, it seems the
size of a trim isn't as problematic as the trim io itself.

When reading in the free space cache from disk, if sync discard
(DISCARD_SYNC) is set, mark all extents as trimmed. The current code
ensures at transaction commit that all free space is trimmed when sync
discard is set, so this reflects that.
Signed-off-by: Dennis Zhou <dennis@kernel.org>
Reviewed-by: David Sterba <dsterba@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
parent 46b27f50
...@@ -752,6 +752,14 @@ static int __load_free_space_cache(struct btrfs_root *root, struct inode *inode, ...@@ -752,6 +752,14 @@ static int __load_free_space_cache(struct btrfs_root *root, struct inode *inode,
goto free_cache; goto free_cache;
} }
/*
* Sync discard ensures that the free space cache is always
* trimmed. So when reading this in, the state should reflect
* that.
*/
if (btrfs_test_opt(fs_info, DISCARD_SYNC))
e->trim_state = BTRFS_TRIM_STATE_TRIMMED;
if (!e->bytes) { if (!e->bytes) {
kmem_cache_free(btrfs_free_space_cachep, e); kmem_cache_free(btrfs_free_space_cachep, e);
goto free_cache; goto free_cache;
...@@ -2161,6 +2169,22 @@ static int insert_into_bitmap(struct btrfs_free_space_ctl *ctl, ...@@ -2161,6 +2169,22 @@ static int insert_into_bitmap(struct btrfs_free_space_ctl *ctl,
return ret; return ret;
} }
/*
* Free space merging rules:
* 1) Merge trimmed areas together
* 2) Let untrimmed areas coalesce with trimmed areas
* 3) Always pull neighboring regions from bitmaps
*
* The above rules are for when we merge free space based on btrfs_trim_state.
* Rules 2 and 3 are subtle because they are suboptimal, but are done for the
* same reason: to promote larger extent regions which makes life easier for
* find_free_extent(). Rule 2 enables coalescing on the common path, which
* is free space being returned from btrfs_finish_extent_commit(). Conversely,
* a newly added trimmed region is not aggregated with untrimmed regions in
* the rb_tree. Rule 3 is purely to obtain larger extents
* and provide find_free_extent() with the largest extents possible hoping for
* the reuse path.
*/
static bool try_merge_free_space(struct btrfs_free_space_ctl *ctl, static bool try_merge_free_space(struct btrfs_free_space_ctl *ctl,
struct btrfs_free_space *info, bool update_stat) struct btrfs_free_space *info, bool update_stat)
{ {
...@@ -2169,6 +2193,7 @@ static bool try_merge_free_space(struct btrfs_free_space_ctl *ctl, ...@@ -2169,6 +2193,7 @@ static bool try_merge_free_space(struct btrfs_free_space_ctl *ctl,
bool merged = false; bool merged = false;
u64 offset = info->offset; u64 offset = info->offset;
u64 bytes = info->bytes; u64 bytes = info->bytes;
const bool is_trimmed = btrfs_free_space_trimmed(info);
/* /*
* first we want to see if there is free space adjacent to the range we * first we want to see if there is free space adjacent to the range we
...@@ -2182,7 +2207,9 @@ static bool try_merge_free_space(struct btrfs_free_space_ctl *ctl, ...@@ -2182,7 +2207,9 @@ static bool try_merge_free_space(struct btrfs_free_space_ctl *ctl,
else else
left_info = tree_search_offset(ctl, offset - 1, 0, 0); left_info = tree_search_offset(ctl, offset - 1, 0, 0);
if (right_info && !right_info->bitmap) { /* See try_merge_free_space() comment. */
if (right_info && !right_info->bitmap &&
(!is_trimmed || btrfs_free_space_trimmed(right_info))) {
if (update_stat) if (update_stat)
unlink_free_space(ctl, right_info); unlink_free_space(ctl, right_info);
else else
...@@ -2192,8 +2219,10 @@ static bool try_merge_free_space(struct btrfs_free_space_ctl *ctl, ...@@ -2192,8 +2219,10 @@ static bool try_merge_free_space(struct btrfs_free_space_ctl *ctl,
merged = true; merged = true;
} }
/* See try_merge_free_space() comment. */
if (left_info && !left_info->bitmap && if (left_info && !left_info->bitmap &&
left_info->offset + left_info->bytes == offset) { left_info->offset + left_info->bytes == offset &&
(!is_trimmed || btrfs_free_space_trimmed(left_info))) {
if (update_stat) if (update_stat)
unlink_free_space(ctl, left_info); unlink_free_space(ctl, left_info);
else else
...@@ -2229,6 +2258,10 @@ static bool steal_from_bitmap_to_end(struct btrfs_free_space_ctl *ctl, ...@@ -2229,6 +2258,10 @@ static bool steal_from_bitmap_to_end(struct btrfs_free_space_ctl *ctl,
bytes = (j - i) * ctl->unit; bytes = (j - i) * ctl->unit;
info->bytes += bytes; info->bytes += bytes;
/* See try_merge_free_space() comment. */
if (!btrfs_free_space_trimmed(bitmap))
info->trim_state = BTRFS_TRIM_STATE_UNTRIMMED;
if (update_stat) if (update_stat)
bitmap_clear_bits(ctl, bitmap, end, bytes); bitmap_clear_bits(ctl, bitmap, end, bytes);
else else
...@@ -2282,6 +2315,10 @@ static bool steal_from_bitmap_to_front(struct btrfs_free_space_ctl *ctl, ...@@ -2282,6 +2315,10 @@ static bool steal_from_bitmap_to_front(struct btrfs_free_space_ctl *ctl,
info->offset -= bytes; info->offset -= bytes;
info->bytes += bytes; info->bytes += bytes;
/* See try_merge_free_space() comment. */
if (!btrfs_free_space_trimmed(bitmap))
info->trim_state = BTRFS_TRIM_STATE_UNTRIMMED;
if (update_stat) if (update_stat)
bitmap_clear_bits(ctl, bitmap, info->offset, bytes); bitmap_clear_bits(ctl, bitmap, info->offset, bytes);
else else
...@@ -2331,7 +2368,8 @@ static void steal_from_bitmap(struct btrfs_free_space_ctl *ctl, ...@@ -2331,7 +2368,8 @@ static void steal_from_bitmap(struct btrfs_free_space_ctl *ctl,
int __btrfs_add_free_space(struct btrfs_fs_info *fs_info, int __btrfs_add_free_space(struct btrfs_fs_info *fs_info,
struct btrfs_free_space_ctl *ctl, struct btrfs_free_space_ctl *ctl,
u64 offset, u64 bytes) u64 offset, u64 bytes,
enum btrfs_trim_state trim_state)
{ {
struct btrfs_free_space *info; struct btrfs_free_space *info;
int ret = 0; int ret = 0;
...@@ -2342,6 +2380,7 @@ int __btrfs_add_free_space(struct btrfs_fs_info *fs_info, ...@@ -2342,6 +2380,7 @@ int __btrfs_add_free_space(struct btrfs_fs_info *fs_info,
info->offset = offset; info->offset = offset;
info->bytes = bytes; info->bytes = bytes;
info->trim_state = trim_state;
RB_CLEAR_NODE(&info->offset_index); RB_CLEAR_NODE(&info->offset_index);
spin_lock(&ctl->tree_lock); spin_lock(&ctl->tree_lock);
...@@ -2387,9 +2426,14 @@ int __btrfs_add_free_space(struct btrfs_fs_info *fs_info, ...@@ -2387,9 +2426,14 @@ int __btrfs_add_free_space(struct btrfs_fs_info *fs_info,
int btrfs_add_free_space(struct btrfs_block_group *block_group, int btrfs_add_free_space(struct btrfs_block_group *block_group,
u64 bytenr, u64 size) u64 bytenr, u64 size)
{ {
enum btrfs_trim_state trim_state = BTRFS_TRIM_STATE_UNTRIMMED;
if (btrfs_test_opt(block_group->fs_info, DISCARD_SYNC))
trim_state = BTRFS_TRIM_STATE_TRIMMED;
return __btrfs_add_free_space(block_group->fs_info, return __btrfs_add_free_space(block_group->fs_info,
block_group->free_space_ctl, block_group->free_space_ctl,
bytenr, size); bytenr, size, trim_state);
} }
int btrfs_remove_free_space(struct btrfs_block_group *block_group, int btrfs_remove_free_space(struct btrfs_block_group *block_group,
...@@ -2464,8 +2508,10 @@ int btrfs_remove_free_space(struct btrfs_block_group *block_group, ...@@ -2464,8 +2508,10 @@ int btrfs_remove_free_space(struct btrfs_block_group *block_group,
} }
spin_unlock(&ctl->tree_lock); spin_unlock(&ctl->tree_lock);
ret = btrfs_add_free_space(block_group, offset + bytes, ret = __btrfs_add_free_space(block_group->fs_info, ctl,
old_end - (offset + bytes)); offset + bytes,
old_end - (offset + bytes),
info->trim_state);
WARN_ON(ret); WARN_ON(ret);
goto out; goto out;
} }
...@@ -2634,6 +2680,7 @@ u64 btrfs_find_space_for_alloc(struct btrfs_block_group *block_group, ...@@ -2634,6 +2680,7 @@ u64 btrfs_find_space_for_alloc(struct btrfs_block_group *block_group,
u64 ret = 0; u64 ret = 0;
u64 align_gap = 0; u64 align_gap = 0;
u64 align_gap_len = 0; u64 align_gap_len = 0;
enum btrfs_trim_state align_gap_trim_state = BTRFS_TRIM_STATE_UNTRIMMED;
spin_lock(&ctl->tree_lock); spin_lock(&ctl->tree_lock);
entry = find_free_space(ctl, &offset, &bytes_search, entry = find_free_space(ctl, &offset, &bytes_search,
...@@ -2650,6 +2697,7 @@ u64 btrfs_find_space_for_alloc(struct btrfs_block_group *block_group, ...@@ -2650,6 +2697,7 @@ u64 btrfs_find_space_for_alloc(struct btrfs_block_group *block_group,
unlink_free_space(ctl, entry); unlink_free_space(ctl, entry);
align_gap_len = offset - entry->offset; align_gap_len = offset - entry->offset;
align_gap = entry->offset; align_gap = entry->offset;
align_gap_trim_state = entry->trim_state;
entry->offset = offset + bytes; entry->offset = offset + bytes;
WARN_ON(entry->bytes < bytes + align_gap_len); WARN_ON(entry->bytes < bytes + align_gap_len);
...@@ -2665,7 +2713,8 @@ u64 btrfs_find_space_for_alloc(struct btrfs_block_group *block_group, ...@@ -2665,7 +2713,8 @@ u64 btrfs_find_space_for_alloc(struct btrfs_block_group *block_group,
if (align_gap_len) if (align_gap_len)
__btrfs_add_free_space(block_group->fs_info, ctl, __btrfs_add_free_space(block_group->fs_info, ctl,
align_gap, align_gap_len); align_gap, align_gap_len,
align_gap_trim_state);
return ret; return ret;
} }
......
...@@ -6,6 +6,14 @@ ...@@ -6,6 +6,14 @@
#ifndef BTRFS_FREE_SPACE_CACHE_H #ifndef BTRFS_FREE_SPACE_CACHE_H
#define BTRFS_FREE_SPACE_CACHE_H #define BTRFS_FREE_SPACE_CACHE_H
/*
* This is the trim state of an extent or bitmap.
*
* The state is stored in btrfs_free_space::trim_state and is consulted when
* free space entries are merged: an untrimmed region may merge with any
* neighboring extent, while a trimmed region only merges with neighbors that
* are also trimmed.
*/
enum btrfs_trim_state {
/*
* Default state used by btrfs_add_free_space() when DISCARD_SYNC is not
* set. Must remain the first enumerator (value 0): some callers of
* __btrfs_add_free_space() pass a literal 0 as the trim state.
*/
BTRFS_TRIM_STATE_UNTRIMMED,
/*
* The region is considered already discarded. Assigned to entries read
* from the on-disk cache, and to space added through
* btrfs_add_free_space(), when DISCARD_SYNC is set.
*/
BTRFS_TRIM_STATE_TRIMMED,
};
struct btrfs_free_space { struct btrfs_free_space {
struct rb_node offset_index; struct rb_node offset_index;
u64 offset; u64 offset;
...@@ -13,8 +21,14 @@ struct btrfs_free_space { ...@@ -13,8 +21,14 @@ struct btrfs_free_space {
u64 max_extent_size; u64 max_extent_size;
unsigned long *bitmap; unsigned long *bitmap;
struct list_head list; struct list_head list;
enum btrfs_trim_state trim_state;
}; };
static inline bool btrfs_free_space_trimmed(struct btrfs_free_space *info)
{
return (info->trim_state == BTRFS_TRIM_STATE_TRIMMED);
}
struct btrfs_free_space_ctl { struct btrfs_free_space_ctl {
spinlock_t tree_lock; spinlock_t tree_lock;
struct rb_root free_space_offset; struct rb_root free_space_offset;
...@@ -83,7 +97,8 @@ int btrfs_write_out_ino_cache(struct btrfs_root *root, ...@@ -83,7 +97,8 @@ int btrfs_write_out_ino_cache(struct btrfs_root *root,
void btrfs_init_free_space_ctl(struct btrfs_block_group *block_group); void btrfs_init_free_space_ctl(struct btrfs_block_group *block_group);
int __btrfs_add_free_space(struct btrfs_fs_info *fs_info, int __btrfs_add_free_space(struct btrfs_fs_info *fs_info,
struct btrfs_free_space_ctl *ctl, struct btrfs_free_space_ctl *ctl,
u64 bytenr, u64 size); u64 bytenr, u64 size,
enum btrfs_trim_state trim_state);
int btrfs_add_free_space(struct btrfs_block_group *block_group, int btrfs_add_free_space(struct btrfs_block_group *block_group,
u64 bytenr, u64 size); u64 bytenr, u64 size);
int btrfs_remove_free_space(struct btrfs_block_group *block_group, int btrfs_remove_free_space(struct btrfs_block_group *block_group,
......
...@@ -107,7 +107,7 @@ static int caching_kthread(void *data) ...@@ -107,7 +107,7 @@ static int caching_kthread(void *data)
if (last != (u64)-1 && last + 1 != key.objectid) { if (last != (u64)-1 && last + 1 != key.objectid) {
__btrfs_add_free_space(fs_info, ctl, last + 1, __btrfs_add_free_space(fs_info, ctl, last + 1,
key.objectid - last - 1); key.objectid - last - 1, 0);
wake_up(&root->ino_cache_wait); wake_up(&root->ino_cache_wait);
} }
...@@ -118,7 +118,7 @@ static int caching_kthread(void *data) ...@@ -118,7 +118,7 @@ static int caching_kthread(void *data)
if (last < root->highest_objectid - 1) { if (last < root->highest_objectid - 1) {
__btrfs_add_free_space(fs_info, ctl, last + 1, __btrfs_add_free_space(fs_info, ctl, last + 1,
root->highest_objectid - last - 1); root->highest_objectid - last - 1, 0);
} }
spin_lock(&root->ino_cache_lock); spin_lock(&root->ino_cache_lock);
...@@ -175,7 +175,8 @@ static void start_caching(struct btrfs_root *root) ...@@ -175,7 +175,8 @@ static void start_caching(struct btrfs_root *root)
ret = btrfs_find_free_objectid(root, &objectid); ret = btrfs_find_free_objectid(root, &objectid);
if (!ret && objectid <= BTRFS_LAST_FREE_OBJECTID) { if (!ret && objectid <= BTRFS_LAST_FREE_OBJECTID) {
__btrfs_add_free_space(fs_info, ctl, objectid, __btrfs_add_free_space(fs_info, ctl, objectid,
BTRFS_LAST_FREE_OBJECTID - objectid + 1); BTRFS_LAST_FREE_OBJECTID - objectid + 1,
0);
wake_up(&root->ino_cache_wait); wake_up(&root->ino_cache_wait);
} }
...@@ -221,7 +222,7 @@ void btrfs_return_ino(struct btrfs_root *root, u64 objectid) ...@@ -221,7 +222,7 @@ void btrfs_return_ino(struct btrfs_root *root, u64 objectid)
return; return;
again: again:
if (root->ino_cache_state == BTRFS_CACHE_FINISHED) { if (root->ino_cache_state == BTRFS_CACHE_FINISHED) {
__btrfs_add_free_space(fs_info, pinned, objectid, 1); __btrfs_add_free_space(fs_info, pinned, objectid, 1, 0);
} else { } else {
down_write(&fs_info->commit_root_sem); down_write(&fs_info->commit_root_sem);
spin_lock(&root->ino_cache_lock); spin_lock(&root->ino_cache_lock);
...@@ -234,7 +235,7 @@ void btrfs_return_ino(struct btrfs_root *root, u64 objectid) ...@@ -234,7 +235,7 @@ void btrfs_return_ino(struct btrfs_root *root, u64 objectid)
start_caching(root); start_caching(root);
__btrfs_add_free_space(fs_info, pinned, objectid, 1); __btrfs_add_free_space(fs_info, pinned, objectid, 1, 0);
up_write(&fs_info->commit_root_sem); up_write(&fs_info->commit_root_sem);
} }
...@@ -281,7 +282,7 @@ void btrfs_unpin_free_ino(struct btrfs_root *root) ...@@ -281,7 +282,7 @@ void btrfs_unpin_free_ino(struct btrfs_root *root)
spin_unlock(rbroot_lock); spin_unlock(rbroot_lock);
if (count) if (count)
__btrfs_add_free_space(root->fs_info, ctl, __btrfs_add_free_space(root->fs_info, ctl,
info->offset, count); info->offset, count, 0);
kmem_cache_free(btrfs_free_space_cachep, info); kmem_cache_free(btrfs_free_space_cachep, info);
} }
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment