Commit 75d893d1 authored by Darrick J. Wong

xfs: speed up rmap lookups by using non-overlapped lookups when possible

Reverse mapping on a reflink-capable filesystem has some pretty high
overhead when performing file operations.  This is because the rmap
records for logically and physically adjacent extents might not be
adjacent in the rmap index due to data block sharing.  As a result, we
use an expensive overlapped-interval btree search, which walks every record
that overlaps with the supplied key in the hopes of finding the record.

However, profiling data shows that when the index contains a record that
is an exact match for a query key, the non-overlapped btree search
function can find the record much faster than the overlapped version.
Try the non-overlapped lookup first, which will make scrub run much
faster.

Signed-off-by: Darrick J. Wong <djwong@kernel.org>
Reviewed-by: Dave Chinner <dchinner@redhat.com>
Reviewed-by: Christoph Hellwig <hch@lst.de>
parent 5b7ca8b3
...@@ -367,7 +367,6 @@ xfs_rmap_lookup_le_range_helper( ...@@ -367,7 +367,6 @@ xfs_rmap_lookup_le_range_helper(
return 0; return 0;
*info->irec = *rec; *info->irec = *rec;
*info->stat = 1;
return -ECANCELED; return -ECANCELED;
} }
...@@ -388,6 +387,7 @@ xfs_rmap_lookup_le_range( ...@@ -388,6 +387,7 @@ xfs_rmap_lookup_le_range(
int *stat) int *stat)
{ {
struct xfs_find_left_neighbor_info info; struct xfs_find_left_neighbor_info info;
int found = 0;
int error; int error;
info.high.rm_startblock = bno; info.high.rm_startblock = bno;
...@@ -400,20 +400,44 @@ xfs_rmap_lookup_le_range( ...@@ -400,20 +400,44 @@ xfs_rmap_lookup_le_range(
info.high.rm_blockcount = 0; info.high.rm_blockcount = 0;
*stat = 0; *stat = 0;
info.irec = irec; info.irec = irec;
info.stat = stat;
trace_xfs_rmap_lookup_le_range(cur->bc_mp, trace_xfs_rmap_lookup_le_range(cur->bc_mp, cur->bc_ag.pag->pag_agno,
cur->bc_ag.pag->pag_agno, bno, 0, owner, offset, flags); bno, 0, owner, offset, flags);
error = xfs_rmap_query_range(cur, &info.high, &info.high,
xfs_rmap_lookup_le_range_helper, &info); /*
if (error == -ECANCELED) * Historically, we always used the range query to walk every reverse
error = 0; * mapping that could possibly overlap the key that the caller asked
if (*stat) * for, and filter out the ones that don't. That is very slow when
trace_xfs_rmap_lookup_le_range_result(cur->bc_mp, * there are a lot of records.
cur->bc_ag.pag->pag_agno, irec->rm_startblock, *
irec->rm_blockcount, irec->rm_owner, * However, there are two scenarios where the classic btree search can
irec->rm_offset, irec->rm_flags); * produce correct results -- if the index contains a record that is an
return error; * exact match for the lookup key; and if there are no other records
* between the record we want and the key we supplied.
*
* As an optimization, try a non-overlapped lookup first. This makes
* scrub run much faster on most filesystems because bmbt records are
* usually an exact match for rmap records. If we don't find what we
* want, we fall back to the overlapped query.
*/
error = xfs_rmap_lookup_le(cur, bno, owner, offset, flags, irec,
&found);
if (error)
return error;
if (found)
error = xfs_rmap_lookup_le_range_helper(cur, irec, &info);
if (!error)
error = xfs_rmap_query_range(cur, &info.high, &info.high,
xfs_rmap_lookup_le_range_helper, &info);
if (error != -ECANCELED)
return error;
*stat = 1;
trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
cur->bc_ag.pag->pag_agno, irec->rm_startblock,
irec->rm_blockcount, irec->rm_owner, irec->rm_offset,
irec->rm_flags);
return 0;
} }
/* /*
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment