Commit 524bcd1e authored by Christoph Hellwig, committed by David Sterba

btrfs: simplify the pending I/O counting in struct compressed_bio

Instead of counting the sectors just count the bios, with an extra
reference held during submission.  This significantly simplifies the
submission side error handling.

This slightly changes completion and error handling of
btrfs_submit_compressed_{read,write}: with the old code the
compressed_bio could have been completed in
btrfs_submit_compressed_{read,write} only if there was an error during
submission of one of the lower bios, whilst with the new code there is a
chance for this to happen even for a successful submission if all the
lower bios complete before the end of the function is reached.

Reviewed-by: Nikolay Borisov <nborisov@suse.com>
Reviewed-by: Boris Burkov <boris@bur.io>
Signed-off-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: David Sterba <dsterba@suse.com>
parent c144c63f
...@@ -191,44 +191,6 @@ static int check_compressed_csum(struct btrfs_inode *inode, struct bio *bio, ...@@ -191,44 +191,6 @@ static int check_compressed_csum(struct btrfs_inode *inode, struct bio *bio,
return 0; return 0;
} }
/*
 * Reduce bio and io accounting for a compressed_bio with its corresponding bio.
 *
 * @cb:  compressed_bio whose pending_sectors count is reduced
 * @bio: completed bio; the summed length of its segments is the amount
 *       subtracted from the count, and a non-zero bi_status is copied
 *       into cb->status
 *
 * wake_up_var(cb) is called on every invocation, after the accounting has
 * been updated.
 *
 * Return true if there is no pending bio nor io.
 * Return false otherwise.
 */
static bool dec_and_test_compressed_bio(struct compressed_bio *cb, struct bio *bio)
{
struct btrfs_fs_info *fs_info = btrfs_sb(cb->inode->i_sb);
unsigned int bi_size = 0;
bool last_io = false;
struct bio_vec *bvec;
struct bvec_iter_all iter_all;
/*
 * At endio time, bi_iter.bi_size doesn't represent the real bio size.
 * Thus here we have to iterate through all segments to grab correct
 * bio size.
 */
bio_for_each_segment_all(bvec, bio, iter_all)
bi_size += bvec->bv_len;
/*
 * Only a failing bio updates the status, so a later successful bio
 * does not overwrite an error recorded earlier.
 */
if (bio->bi_status)
cb->status = bio->bi_status;
ASSERT(bi_size && bi_size <= cb->compressed_len);
/* pending_sectors counts sectors, so convert the byte total first. */
last_io = refcount_sub_and_test(bi_size >> fs_info->sectorsize_bits,
&cb->pending_sectors);
/*
 * Here we must wake up the possible error handler after all other
 * operations on @cb finished, or we can race with
 * finish_compressed_bio_*() which may free @cb.
 */
wake_up_var(cb);
return last_io;
}
static void finish_compressed_bio_read(struct compressed_bio *cb) static void finish_compressed_bio_read(struct compressed_bio *cb)
{ {
unsigned int index; unsigned int index;
...@@ -288,7 +250,10 @@ static void end_compressed_bio_read(struct bio *bio) ...@@ -288,7 +250,10 @@ static void end_compressed_bio_read(struct bio *bio)
unsigned int mirror = btrfs_bio(bio)->mirror_num; unsigned int mirror = btrfs_bio(bio)->mirror_num;
int ret = 0; int ret = 0;
if (!dec_and_test_compressed_bio(cb, bio)) if (bio->bi_status)
cb->status = bio->bi_status;
if (!refcount_dec_and_test(&cb->pending_ios))
goto out; goto out;
/* /*
...@@ -417,7 +382,10 @@ static void end_compressed_bio_write(struct bio *bio) ...@@ -417,7 +382,10 @@ static void end_compressed_bio_write(struct bio *bio)
{ {
struct compressed_bio *cb = bio->bi_private; struct compressed_bio *cb = bio->bi_private;
if (dec_and_test_compressed_bio(cb, bio)) { if (bio->bi_status)
cb->status = bio->bi_status;
if (refcount_dec_and_test(&cb->pending_ios)) {
struct btrfs_fs_info *fs_info = btrfs_sb(cb->inode->i_sb); struct btrfs_fs_info *fs_info = btrfs_sb(cb->inode->i_sb);
btrfs_record_physical_zoned(cb->inode, cb->start, bio); btrfs_record_physical_zoned(cb->inode, cb->start, bio);
...@@ -476,7 +444,7 @@ static struct bio *alloc_compressed_bio(struct compressed_bio *cb, u64 disk_byte ...@@ -476,7 +444,7 @@ static struct bio *alloc_compressed_bio(struct compressed_bio *cb, u64 disk_byte
return ERR_PTR(ret); return ERR_PTR(ret);
} }
*next_stripe_start = disk_bytenr + geom.len; *next_stripe_start = disk_bytenr + geom.len;
refcount_inc(&cb->pending_ios);
return bio; return bio;
} }
...@@ -503,7 +471,7 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start, ...@@ -503,7 +471,7 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start,
struct compressed_bio *cb; struct compressed_bio *cb;
u64 cur_disk_bytenr = disk_start; u64 cur_disk_bytenr = disk_start;
u64 next_stripe_start; u64 next_stripe_start;
blk_status_t ret; blk_status_t ret = BLK_STS_OK;
int skip_sum = inode->flags & BTRFS_INODE_NODATASUM; int skip_sum = inode->flags & BTRFS_INODE_NODATASUM;
const bool use_append = btrfs_use_zone_append(inode, disk_start); const bool use_append = btrfs_use_zone_append(inode, disk_start);
const unsigned int bio_op = use_append ? REQ_OP_ZONE_APPEND : REQ_OP_WRITE; const unsigned int bio_op = use_append ? REQ_OP_ZONE_APPEND : REQ_OP_WRITE;
...@@ -513,7 +481,7 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start, ...@@ -513,7 +481,7 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start,
cb = kmalloc(compressed_bio_size(fs_info, compressed_len), GFP_NOFS); cb = kmalloc(compressed_bio_size(fs_info, compressed_len), GFP_NOFS);
if (!cb) if (!cb)
return BLK_STS_RESOURCE; return BLK_STS_RESOURCE;
refcount_set(&cb->pending_sectors, compressed_len >> fs_info->sectorsize_bits); refcount_set(&cb->pending_ios, 1);
cb->status = BLK_STS_OK; cb->status = BLK_STS_OK;
cb->inode = &inode->vfs_inode; cb->inode = &inode->vfs_inode;
cb->start = start; cb->start = start;
...@@ -543,8 +511,7 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start, ...@@ -543,8 +511,7 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start,
&next_stripe_start); &next_stripe_start);
if (IS_ERR(bio)) { if (IS_ERR(bio)) {
ret = errno_to_blk_status(PTR_ERR(bio)); ret = errno_to_blk_status(PTR_ERR(bio));
bio = NULL; break;
goto finish_cb;
} }
if (blkcg_css) if (blkcg_css)
bio->bi_opf |= REQ_CGROUP_PUNT; bio->bi_opf |= REQ_CGROUP_PUNT;
...@@ -588,8 +555,11 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start, ...@@ -588,8 +555,11 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start,
if (submit) { if (submit) {
if (!skip_sum) { if (!skip_sum) {
ret = btrfs_csum_one_bio(inode, bio, start, true); ret = btrfs_csum_one_bio(inode, bio, start, true);
if (ret) if (ret) {
goto finish_cb; bio->bi_status = ret;
bio_endio(bio);
break;
}
} }
ASSERT(bio->bi_iter.bi_size); ASSERT(bio->bi_iter.bi_size);
...@@ -598,32 +568,11 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start, ...@@ -598,32 +568,11 @@ blk_status_t btrfs_submit_compressed_write(struct btrfs_inode *inode, u64 start,
} }
cond_resched(); cond_resched();
} }
if (blkcg_css)
kthread_associate_blkcg(NULL);
return 0;
finish_cb:
if (blkcg_css) if (blkcg_css)
kthread_associate_blkcg(NULL); kthread_associate_blkcg(NULL);
if (bio) { if (refcount_dec_and_test(&cb->pending_ios))
bio->bi_status = ret;
bio_endio(bio);
}
/* Last byte of @cb is submitted, endio will free @cb */
if (cur_disk_bytenr == disk_start + compressed_len)
return ret;
wait_var_event(cb, refcount_read(&cb->pending_sectors) ==
(disk_start + compressed_len - cur_disk_bytenr) >>
fs_info->sectorsize_bits);
/*
* Even with previous bio ended, we should still have io not yet
* submitted, thus need to finish manually.
*/
ASSERT(refcount_read(&cb->pending_sectors));
/* Now we are the only one referring @cb, can finish it safely. */
finish_compressed_bio_write(cb); finish_compressed_bio_write(cb);
return ret; return ret;
} }
...@@ -830,7 +779,7 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio, ...@@ -830,7 +779,7 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio,
goto out; goto out;
} }
refcount_set(&cb->pending_sectors, compressed_len >> fs_info->sectorsize_bits); refcount_set(&cb->pending_ios, 1);
cb->status = BLK_STS_OK; cb->status = BLK_STS_OK;
cb->inode = inode; cb->inode = inode;
cb->mirror_num = mirror_num; cb->mirror_num = mirror_num;
...@@ -880,9 +829,8 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio, ...@@ -880,9 +829,8 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio,
REQ_OP_READ, end_compressed_bio_read, REQ_OP_READ, end_compressed_bio_read,
&next_stripe_start); &next_stripe_start);
if (IS_ERR(comp_bio)) { if (IS_ERR(comp_bio)) {
ret = errno_to_blk_status(PTR_ERR(comp_bio)); cb->status = errno_to_blk_status(PTR_ERR(comp_bio));
comp_bio = NULL; break;
goto finish_cb;
} }
} }
/* /*
...@@ -921,8 +869,11 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio, ...@@ -921,8 +869,11 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio,
unsigned int nr_sectors; unsigned int nr_sectors;
ret = btrfs_lookup_bio_sums(inode, comp_bio, sums); ret = btrfs_lookup_bio_sums(inode, comp_bio, sums);
if (ret) if (ret) {
goto finish_cb; comp_bio->bi_status = ret;
bio_endio(comp_bio);
break;
}
nr_sectors = DIV_ROUND_UP(comp_bio->bi_iter.bi_size, nr_sectors = DIV_ROUND_UP(comp_bio->bi_iter.bi_size,
fs_info->sectorsize); fs_info->sectorsize);
...@@ -933,6 +884,9 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio, ...@@ -933,6 +884,9 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio,
comp_bio = NULL; comp_bio = NULL;
} }
} }
if (refcount_dec_and_test(&cb->pending_ios))
finish_compressed_bio_read(cb);
return; return;
fail: fail:
...@@ -950,25 +904,6 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio, ...@@ -950,25 +904,6 @@ void btrfs_submit_compressed_read(struct inode *inode, struct bio *bio,
bio->bi_status = ret; bio->bi_status = ret;
bio_endio(bio); bio_endio(bio);
return; return;
finish_cb:
if (comp_bio) {
comp_bio->bi_status = ret;
bio_endio(comp_bio);
}
/* All bytes of @cb is submitted, endio will free @cb */
if (cur_disk_byte == disk_bytenr + compressed_len)
return;
wait_var_event(cb, refcount_read(&cb->pending_sectors) ==
(disk_bytenr + compressed_len - cur_disk_byte) >>
fs_info->sectorsize_bits);
/*
* Even with previous bio ended, we should still have io not yet
* submitted, thus need to finish @cb manually.
*/
ASSERT(refcount_read(&cb->pending_sectors));
/* Now we are the only one referring @cb, can finish it safely. */
finish_compressed_bio_read(cb);
} }
/* /*
......
...@@ -30,8 +30,8 @@ static_assert((BTRFS_MAX_COMPRESSED % PAGE_SIZE) == 0); ...@@ -30,8 +30,8 @@ static_assert((BTRFS_MAX_COMPRESSED % PAGE_SIZE) == 0);
#define BTRFS_ZLIB_DEFAULT_LEVEL 3 #define BTRFS_ZLIB_DEFAULT_LEVEL 3
struct compressed_bio { struct compressed_bio {
/* Number of sectors with unfinished IO (unsubmitted or unfinished) */ /* Number of outstanding bios */
refcount_t pending_sectors; refcount_t pending_ios;
/* Number of compressed pages in the array */ /* Number of compressed pages in the array */
unsigned int nr_pages; unsigned int nr_pages;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment