Commit c45c8667, authored and committed by Kent Overstreet

bcachefs: bch2_gc_gens() no longer uses bucket array

Like the previous patches, this converts bch2_gc_gens() to use the alloc
btree directly, and to use private arrays of generation numbers for its own
recalculation of oldest_gen.
Signed-off-by: Kent Overstreet <kent.overstreet@gmail.com>
parent d73e0d2c
...@@ -452,6 +452,7 @@ struct bch_dev { ...@@ -452,6 +452,7 @@ struct bch_dev {
*/ */
struct bucket_array __rcu *buckets[2]; struct bucket_array __rcu *buckets[2];
struct bucket_gens __rcu *bucket_gens; struct bucket_gens __rcu *bucket_gens;
u8 *oldest_gen;
unsigned long *buckets_nouse; unsigned long *buckets_nouse;
struct rw_semaphore bucket_lock; struct rw_semaphore bucket_lock;
...@@ -806,6 +807,7 @@ struct bch_fs { ...@@ -806,6 +807,7 @@ struct bch_fs {
* it's not while a gc is in progress. * it's not while a gc is in progress.
*/ */
struct rw_semaphore gc_lock; struct rw_semaphore gc_lock;
struct mutex gc_gens_lock;
/* IO PATH */ /* IO PATH */
struct semaphore io_in_flight; struct semaphore io_in_flight;
......
...@@ -1787,9 +1787,8 @@ static bool gc_btree_gens_key(struct bch_fs *c, struct bkey_s_c k) ...@@ -1787,9 +1787,8 @@ static bool gc_btree_gens_key(struct bch_fs *c, struct bkey_s_c k)
percpu_down_read(&c->mark_lock); percpu_down_read(&c->mark_lock);
bkey_for_each_ptr(ptrs, ptr) { bkey_for_each_ptr(ptrs, ptr) {
struct bch_dev *ca = bch_dev_bkey_exists(c, ptr->dev); struct bch_dev *ca = bch_dev_bkey_exists(c, ptr->dev);
struct bucket *g = PTR_BUCKET(ca, ptr);
if (gen_after(g->mark.gen, ptr->gen) > 16) { if (ptr_stale(ca, ptr) > 16) {
percpu_up_read(&c->mark_lock); percpu_up_read(&c->mark_lock);
return true; return true;
} }
...@@ -1797,10 +1796,10 @@ static bool gc_btree_gens_key(struct bch_fs *c, struct bkey_s_c k) ...@@ -1797,10 +1796,10 @@ static bool gc_btree_gens_key(struct bch_fs *c, struct bkey_s_c k)
bkey_for_each_ptr(ptrs, ptr) { bkey_for_each_ptr(ptrs, ptr) {
struct bch_dev *ca = bch_dev_bkey_exists(c, ptr->dev); struct bch_dev *ca = bch_dev_bkey_exists(c, ptr->dev);
struct bucket *g = PTR_BUCKET(ca, ptr); u8 *gen = &ca->oldest_gen[PTR_BUCKET_NR(ca, ptr)];
if (gen_after(g->gc_gen, ptr->gen)) if (gen_after(*gen, ptr->gen))
g->gc_gen = ptr->gen; *gen = ptr->gen;
} }
percpu_up_read(&c->mark_lock); percpu_up_read(&c->mark_lock);
...@@ -1811,23 +1810,22 @@ static bool gc_btree_gens_key(struct bch_fs *c, struct bkey_s_c k) ...@@ -1811,23 +1810,22 @@ static bool gc_btree_gens_key(struct bch_fs *c, struct bkey_s_c k)
* For recalculating oldest gen, we only need to walk keys in leaf nodes; btree * For recalculating oldest gen, we only need to walk keys in leaf nodes; btree
* node pointers currently never have cached pointers that can become stale: * node pointers currently never have cached pointers that can become stale:
*/ */
static int bch2_gc_btree_gens(struct bch_fs *c, enum btree_id btree_id) static int bch2_gc_btree_gens(struct btree_trans *trans, enum btree_id btree_id)
{ {
struct btree_trans trans; struct bch_fs *c = trans->c;
struct btree_iter iter; struct btree_iter iter;
struct bkey_s_c k; struct bkey_s_c k;
struct bkey_buf sk; struct bkey_buf sk;
int ret = 0, commit_err = 0; int ret = 0, commit_err = 0;
bch2_bkey_buf_init(&sk); bch2_bkey_buf_init(&sk);
bch2_trans_init(&trans, c, 0, 0);
bch2_trans_iter_init(&trans, &iter, btree_id, POS_MIN, bch2_trans_iter_init(trans, &iter, btree_id, POS_MIN,
BTREE_ITER_PREFETCH| BTREE_ITER_PREFETCH|
BTREE_ITER_NOT_EXTENTS| BTREE_ITER_NOT_EXTENTS|
BTREE_ITER_ALL_SNAPSHOTS); BTREE_ITER_ALL_SNAPSHOTS);
while ((bch2_trans_begin(&trans), while ((bch2_trans_begin(trans),
k = bch2_btree_iter_peek(&iter)).k) { k = bch2_btree_iter_peek(&iter)).k) {
ret = bkey_err(k); ret = bkey_err(k);
...@@ -1843,8 +1841,8 @@ static int bch2_gc_btree_gens(struct bch_fs *c, enum btree_id btree_id) ...@@ -1843,8 +1841,8 @@ static int bch2_gc_btree_gens(struct bch_fs *c, enum btree_id btree_id)
bch2_extent_normalize(c, bkey_i_to_s(sk.k)); bch2_extent_normalize(c, bkey_i_to_s(sk.k));
commit_err = commit_err =
bch2_trans_update(&trans, &iter, sk.k, 0) ?: bch2_trans_update(trans, &iter, sk.k, 0) ?:
bch2_trans_commit(&trans, NULL, NULL, bch2_trans_commit(trans, NULL, NULL,
BTREE_INSERT_NOWAIT| BTREE_INSERT_NOWAIT|
BTREE_INSERT_NOFAIL); BTREE_INSERT_NOFAIL);
if (commit_err == -EINTR) { if (commit_err == -EINTR) {
...@@ -1855,20 +1853,42 @@ static int bch2_gc_btree_gens(struct bch_fs *c, enum btree_id btree_id) ...@@ -1855,20 +1853,42 @@ static int bch2_gc_btree_gens(struct bch_fs *c, enum btree_id btree_id)
bch2_btree_iter_advance(&iter); bch2_btree_iter_advance(&iter);
} }
bch2_trans_iter_exit(&trans, &iter); bch2_trans_iter_exit(trans, &iter);
bch2_trans_exit(&trans);
bch2_bkey_buf_exit(&sk, c); bch2_bkey_buf_exit(&sk, c);
return ret; return ret;
} }
static int bch2_alloc_write_oldest_gen(struct btree_trans *trans, struct btree_iter *iter)
{
struct bch_dev *ca = bch_dev_bkey_exists(trans->c, iter->pos.inode);
struct bkey_s_c k;
struct bkey_alloc_unpacked u;
int ret;
k = bch2_btree_iter_peek_slot(iter);
ret = bkey_err(k);
if (ret)
return ret;
u = bch2_alloc_unpack(k);
if (u.oldest_gen == ca->oldest_gen[iter->pos.offset])
return 0;
u.oldest_gen = ca->oldest_gen[iter->pos.offset];
return bch2_alloc_write(trans, iter, &u, BTREE_TRIGGER_NORUN);
}
int bch2_gc_gens(struct bch_fs *c) int bch2_gc_gens(struct bch_fs *c)
{ {
struct btree_trans trans;
struct btree_iter iter;
struct bkey_s_c k;
struct bch_dev *ca; struct bch_dev *ca;
struct bucket_array *buckets; u64 b, start_time = local_clock();
struct bucket *g;
u64 start_time = local_clock();
unsigned i; unsigned i;
int ret; int ret;
...@@ -1877,36 +1897,53 @@ int bch2_gc_gens(struct bch_fs *c) ...@@ -1877,36 +1897,53 @@ int bch2_gc_gens(struct bch_fs *c)
* introduces a deadlock in the RO path - we currently take the state * introduces a deadlock in the RO path - we currently take the state
* lock at the start of going RO, thus the gc thread may get stuck: * lock at the start of going RO, thus the gc thread may get stuck:
*/ */
if (!mutex_trylock(&c->gc_gens_lock))
return 0;
down_read(&c->gc_lock); down_read(&c->gc_lock);
bch2_trans_init(&trans, c, 0, 0);
for_each_member_device(ca, c, i) { for_each_member_device(ca, c, i) {
down_read(&ca->bucket_lock); struct bucket_gens *gens;
buckets = bucket_array(ca);
BUG_ON(ca->oldest_gen);
ca->oldest_gen = kvmalloc(ca->mi.nbuckets, GFP_KERNEL);
if (!ca->oldest_gen) {
percpu_ref_put(&ca->ref);
ret = -ENOMEM;
goto err;
}
gens = bucket_gens(ca);
for_each_bucket(g, buckets) for (b = gens->first_bucket;
g->gc_gen = g->mark.gen; b < gens->nbuckets; b++)
up_read(&ca->bucket_lock); ca->oldest_gen[b] = gens->b[b];
} }
for (i = 0; i < BTREE_ID_NR; i++) for (i = 0; i < BTREE_ID_NR; i++)
if ((1 << i) & BTREE_ID_HAS_PTRS) { if ((1 << i) & BTREE_ID_HAS_PTRS) {
c->gc_gens_btree = i; c->gc_gens_btree = i;
c->gc_gens_pos = POS_MIN; c->gc_gens_pos = POS_MIN;
ret = bch2_gc_btree_gens(c, i); ret = bch2_gc_btree_gens(&trans, i);
if (ret) { if (ret) {
bch_err(c, "error recalculating oldest_gen: %i", ret); bch_err(c, "error recalculating oldest_gen: %i", ret);
goto err; goto err;
} }
} }
for_each_member_device(ca, c, i) { for_each_btree_key(&trans, iter, BTREE_ID_alloc, POS_MIN,
down_read(&ca->bucket_lock); BTREE_ITER_PREFETCH, k, ret) {
buckets = bucket_array(ca); ret = __bch2_trans_do(&trans, NULL, NULL,
BTREE_INSERT_NOFAIL,
for_each_bucket(g, buckets) bch2_alloc_write_oldest_gen(&trans, &iter));
g->oldest_gen = g->gc_gen; if (ret) {
up_read(&ca->bucket_lock); bch_err(c, "error writing oldest_gen: %i", ret);
break;
} }
}
bch2_trans_iter_exit(&trans, &iter);
c->gc_gens_btree = 0; c->gc_gens_btree = 0;
c->gc_gens_pos = POS_MIN; c->gc_gens_pos = POS_MIN;
...@@ -1915,7 +1952,14 @@ int bch2_gc_gens(struct bch_fs *c) ...@@ -1915,7 +1952,14 @@ int bch2_gc_gens(struct bch_fs *c)
bch2_time_stats_update(&c->times[BCH_TIME_btree_gc], start_time); bch2_time_stats_update(&c->times[BCH_TIME_btree_gc], start_time);
err: err:
for_each_member_device(ca, c, i) {
kvfree(ca->oldest_gen);
ca->oldest_gen = NULL;
}
bch2_trans_exit(&trans);
up_read(&c->gc_lock); up_read(&c->gc_lock);
mutex_unlock(&c->gc_gens_lock);
return ret; return ret;
} }
......
...@@ -97,12 +97,6 @@ static inline size_t PTR_BUCKET_NR(const struct bch_dev *ca, ...@@ -97,12 +97,6 @@ static inline size_t PTR_BUCKET_NR(const struct bch_dev *ca,
return sector_to_bucket(ca, ptr->offset); return sector_to_bucket(ca, ptr->offset);
} }
static inline struct bucket *PTR_BUCKET(struct bch_dev *ca,
const struct bch_extent_ptr *ptr)
{
return bucket(ca, PTR_BUCKET_NR(ca, ptr));
}
static inline struct bucket *PTR_GC_BUCKET(struct bch_dev *ca, static inline struct bucket *PTR_GC_BUCKET(struct bch_dev *ca,
const struct bch_extent_ptr *ptr) const struct bch_extent_ptr *ptr)
{ {
......
...@@ -30,7 +30,6 @@ struct bucket { ...@@ -30,7 +30,6 @@ struct bucket {
u64 io_time[2]; u64 io_time[2];
u8 oldest_gen; u8 oldest_gen;
u8 gc_gen;
unsigned gen_valid:1; unsigned gen_valid:1;
u8 stripe_redundancy; u8 stripe_redundancy;
u32 stripe; u32 stripe;
......
...@@ -682,6 +682,7 @@ static struct bch_fs *bch2_fs_alloc(struct bch_sb *sb, struct bch_opts opts) ...@@ -682,6 +682,7 @@ static struct bch_fs *bch2_fs_alloc(struct bch_sb *sb, struct bch_opts opts)
INIT_WORK(&c->read_only_work, bch2_fs_read_only_work); INIT_WORK(&c->read_only_work, bch2_fs_read_only_work);
init_rwsem(&c->gc_lock); init_rwsem(&c->gc_lock);
mutex_init(&c->gc_gens_lock);
for (i = 0; i < BCH_TIME_STAT_NR; i++) for (i = 0; i < BCH_TIME_STAT_NR; i++)
bch2_time_stats_init(&c->times[i]); bch2_time_stats_init(&c->times[i]);
......
...@@ -499,6 +499,17 @@ STORE(bch2_fs) ...@@ -499,6 +499,17 @@ STORE(bch2_fs)
/* Debugging: */ /* Debugging: */
if (!test_bit(BCH_FS_RW, &c->flags))
return -EROFS;
if (attr == &sysfs_prune_cache) {
struct shrink_control sc;
sc.gfp_mask = GFP_KERNEL;
sc.nr_to_scan = strtoul_or_return(buf);
c->btree_cache.shrink.scan_objects(&c->btree_cache.shrink, &sc);
}
if (attr == &sysfs_trigger_gc) { if (attr == &sysfs_trigger_gc) {
/* /*
* Full gc is currently incompatible with btree key cache: * Full gc is currently incompatible with btree key cache:
...@@ -512,14 +523,6 @@ STORE(bch2_fs) ...@@ -512,14 +523,6 @@ STORE(bch2_fs)
#endif #endif
} }
if (attr == &sysfs_prune_cache) {
struct shrink_control sc;
sc.gfp_mask = GFP_KERNEL;
sc.nr_to_scan = strtoul_or_return(buf);
c->btree_cache.shrink.scan_objects(&c->btree_cache.shrink, &sc);
}
#ifdef CONFIG_BCACHEFS_TESTS #ifdef CONFIG_BCACHEFS_TESTS
if (attr == &sysfs_perf_test) { if (attr == &sysfs_perf_test) {
char *tmp = kstrdup(buf, GFP_KERNEL), *p = tmp; char *tmp = kstrdup(buf, GFP_KERNEL), *p = tmp;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment