Commit d97e63b6 authored by Chris Mason, committed by David Woodhouse

Btrfs: early extent mapping support

Signed-off-by: Chris Mason <chris.mason@oracle.com>
parent 74123bd7
...@@ -4,8 +4,8 @@ CFLAGS= -g -Wall ...@@ -4,8 +4,8 @@ CFLAGS= -g -Wall
.c.o: .c.o:
$(CC) $(CFLAGS) -c $< $(CC) $(CFLAGS) -c $<
ctree: ctree.o disk-io.h ctree.h disk-io.o radix-tree.o radix-tree.h ctree: ctree.o disk-io.h ctree.h disk-io.o radix-tree.o radix-tree.h mkfs.o
gcc $(CFLAGS) -o ctree ctree.o disk-io.o radix-tree.o gcc $(CFLAGS) -o ctree ctree.o disk-io.o radix-tree.o mkfs.o
clean: clean:
rm ctree *.o rm ctree *.o
......
...@@ -5,6 +5,8 @@ ...@@ -5,6 +5,8 @@
#include "ctree.h" #include "ctree.h"
#include "disk-io.h" #include "disk-io.h"
static int refill_alloc_extent(struct ctree_root *root);
static inline void init_path(struct ctree_path *p) static inline void init_path(struct ctree_path *p)
{ {
memset(p, 0, sizeof(*p)); memset(p, 0, sizeof(*p));
...@@ -29,7 +31,7 @@ static inline unsigned int leaf_data_end(struct leaf *leaf) ...@@ -29,7 +31,7 @@ static inline unsigned int leaf_data_end(struct leaf *leaf)
{ {
unsigned int nr = leaf->header.nritems; unsigned int nr = leaf->header.nritems;
if (nr == 0) if (nr == 0)
return ARRAY_SIZE(leaf->data); return sizeof(leaf->data);
return leaf->items[nr-1].offset; return leaf->items[nr-1].offset;
} }
...@@ -421,7 +423,7 @@ int insert_ptr(struct ctree_root *root, ...@@ -421,7 +423,7 @@ int insert_ptr(struct ctree_root *root,
* due to splitting. Once we've done all the splitting required * due to splitting. Once we've done all the splitting required
* do the inserts based on the data in the bal array. * do the inserts based on the data in the bal array.
*/ */
memset(bal, 0, ARRAY_SIZE(bal)); memset(bal, 0, sizeof(bal));
while(t && t->node.header.nritems == NODEPTRS_PER_BLOCK) { while(t && t->node.header.nritems == NODEPTRS_PER_BLOCK) {
c = &t->node; c = &t->node;
if (push_node_left(root, path, if (push_node_left(root, path,
...@@ -756,6 +758,7 @@ int insert_item(struct ctree_root *root, struct key *key, ...@@ -756,6 +758,7 @@ int insert_item(struct ctree_root *root, struct key *key,
if (leaf_free_space(leaf) < 0) if (leaf_free_space(leaf) < 0)
BUG(); BUG();
release_path(root, &path); release_path(root, &path);
refill_alloc_extent(root);
return 0; return 0;
} }
...@@ -884,6 +887,135 @@ int del_item(struct ctree_root *root, struct ctree_path *path) ...@@ -884,6 +887,135 @@ int del_item(struct ctree_root *root, struct ctree_path *path)
return 0; return 0;
} }
int next_leaf(struct ctree_root *root, struct ctree_path *path)
{
int slot;
int level = 1;
u64 blocknr;
struct tree_buffer *c;
struct tree_buffer *next;
while(level < MAX_LEVEL) {
if (!path->nodes[level])
return -1;
slot = path->slots[level] + 1;
c = path->nodes[level];
if (slot >= c->node.header.nritems) {
level++;
continue;
}
blocknr = c->node.blockptrs[slot];
next = read_tree_block(root, blocknr);
break;
}
path->slots[level] = slot;
while(1) {
level--;
c = path->nodes[level];
tree_block_release(root, c);
path->nodes[level] = next;
path->slots[level] = 0;
if (!level)
break;
next = read_tree_block(root, next->node.blockptrs[0]);
}
return 0;
}
/*
 * Find a free range of num_blocks blocks and record it as an extent item
 * in root.
 *
 * The tree is searched from the key (search_start, 0, 0).  Items are walked
 * in order; for each one the gap between the end of the previous item
 * (objectid + offset) and the start of the current item is computed, and the
 * first gap strictly larger than num_blocks is used.  The first item visited
 * only seeds the "end of previous extent" value.  When the walk runs off the
 * end of the tree, the range from the last extent end (or search_start if no
 * item was seen) up to search_end is used, provided it can hold num_blocks.
 *
 * On success *ins holds the key of the new extent (objectid = first block,
 * offset = num_blocks) and an extent_item with refs = 1 and the given owner
 * has been inserted under that key.
 *
 * Returns the result of insert_item() on the insert path, or a non-zero
 * value when no usable leaf or no large enough hole was found.
 */
int alloc_extent(struct ctree_root *root, u64 num_blocks, u64 search_start,
		 u64 search_end, u64 owner, struct key *ins)
{
	struct ctree_path path;
	struct key *key;
	int ret;
	u64 hole_size = 0;
	int slot = 0;
	u64 last_block = 0;
	int start_found = 0;
	struct leaf *l;
	struct extent_item extent_item;

	init_path(&path);
	ins->objectid = search_start;
	ins->offset = 0;
	ins->flags = 0;
	ret = search_slot(root, ins, &path);
	/*
	 * NOTE(review): search_slot's return convention is not visible here;
	 * a negative value is assumed to mean failure -- confirm.
	 */
	if (ret < 0)
		goto fail;
	while (1) {
		if (!path.nodes[0]) {
			// FIXME allocate root
			ret = -1;
			goto fail;
		}
		l = &path.nodes[0]->leaf;
		slot = path.slots[0];
		if (slot >= l->header.nritems) {
			ret = next_leaf(root, &path);
			if (ret == 0)
				continue;
			/*
			 * Ran off the end of the tree: the candidate range
			 * starts after the last extent seen, or at
			 * search_start when nothing was seen at all.
			 */
			if (!start_found)
				last_block = search_start;
			if (last_block > search_end) {
				ret = -1;
				goto fail;
			}
			hole_size = search_end - last_block;
			if (hole_size < num_blocks) {
				/* FIXME -ENOSPC */
				ret = -1;
				goto fail;
			}
			ins->objectid = last_block;
			ins->offset = num_blocks;
			goto insert;
		}
		key = &l->items[slot].key;
		if (start_found) {
			hole_size = key->objectid - last_block;
			if (hole_size > num_blocks) {
				ins->objectid = last_block;
				ins->offset = num_blocks;
				goto insert;
			}
		} else
			start_found = 1;
		last_block = key->objectid + key->offset;
		path.slots[0]++;
		printf("last block is not %lu\n", last_block);
	}
insert:
	/*
	 * Drop the search path before inserting, as insert_item does with its
	 * own path.  'key' pointed into the leaf and is not used past here.
	 * NOTE(review): assumes release_path copes with unused path levels.
	 */
	release_path(root, &path);
	extent_item.refs = 1;
	extent_item.owner = owner;
	ret = insert_item(root, ins, &extent_item, sizeof(extent_item));
	return ret;
fail:
	release_path(root, &path);
	return ret;
}
/*
 * Make sure root has blocks available for future tree block allocations.
 *
 * Nothing is done when the active alloc_extent still has more than
 * MAX_LEVEL * 2 unused blocks, or when the reserve_extent still has unused
 * blocks.  Otherwise a new extent of MAX_LEVEL * 4 blocks is allocated from
 * root->extent_root and stored in the reserve_extent.
 *
 * Returns 0 when no refill was needed or the refill succeeded, otherwise the
 * non-zero result of alloc_extent(); the reserve extent is left unchanged in
 * that case.
 */
static int refill_alloc_extent(struct ctree_root *root)
{
	struct alloc_extent *ae = root->alloc_extent;
	struct key key;
	int ret;
	int min_blocks = MAX_LEVEL * 2;

	printf("refill alloc root %p, numused %lu total %lu\n", root, ae->num_used, ae->num_blocks);
	if (ae->num_blocks > ae->num_used && ae->num_blocks - ae->num_used >
	    min_blocks)
		return 0;

	ae = root->reserve_extent;
	if (ae->num_blocks > ae->num_used) {
		if (root->alloc_extent->num_blocks == 0) {
			/* we should swap reserve/alloc_extent when alloc
			 * fills up
			 */
			BUG();
		}
		if (ae->num_blocks - ae->num_used < min_blocks)
			BUG();
		return 0;
	}

	// FIXME, this recurses
	ret = alloc_extent(root->extent_root,
			   min_blocks * 2, 0, (unsigned long)-1, 0, &key);
	/*
	 * Only publish the new range once the extent was really recorded;
	 * otherwise blocks would be handed out that the extent tree does not
	 * know about.
	 */
	if (ret)
		return ret;
	ae->blocknr = key.objectid;
	ae->num_blocks = key.offset;
	ae->num_used = 0;
	return 0;
}
void print_leaf(struct leaf *l) void print_leaf(struct leaf *l)
{ {
int i; int i;
...@@ -948,8 +1080,8 @@ void print_tree(struct ctree_root *root, struct tree_buffer *t) ...@@ -948,8 +1080,8 @@ void print_tree(struct ctree_root *root, struct tree_buffer *t)
/* for testing only */ /* for testing only */
int next_key(int i, int max_key) { int next_key(int i, int max_key) {
return rand() % max_key; // return rand() % max_key;
// return i; return i;
} }
int main() { int main() {
...@@ -960,7 +1092,7 @@ int main() { ...@@ -960,7 +1092,7 @@ int main() {
int i; int i;
int num; int num;
int ret; int ret;
int run_size = 25000; int run_size = 256;
int max_key = 100000000; int max_key = 100000000;
int tree_size = 0; int tree_size = 0;
struct ctree_path path; struct ctree_path path;
...@@ -980,10 +1112,20 @@ int main() { ...@@ -980,10 +1112,20 @@ int main() {
ins.objectid = num; ins.objectid = num;
ins.offset = 0; ins.offset = 0;
ins.flags = 0; ins.flags = 0;
printf("insert %d\n", i);
ret = insert_item(root, &ins, buf, strlen(buf)); ret = insert_item(root, &ins, buf, strlen(buf));
if (!ret) if (!ret)
tree_size++; tree_size++;
printf("done insert %d\n", i);
} }
printf("root used: %lu\n", root->alloc_extent->num_used);
printf("root tree\n");
print_tree(root, root->node);
printf("map tree\n");
printf("map used: %lu\n", root->extent_root->alloc_extent->num_used);
print_tree(root->extent_root, root->extent_root->node);
exit(1);
close_ctree(root); close_ctree(root);
root = open_ctree("dbfile"); root = open_ctree("dbfile");
printf("starting search\n"); printf("starting search\n");
......
#ifndef __CTREE__ #ifndef __CTREE__
#define __CTREE__ #define __CTREE__
#define CTREE_BLOCKSIZE 4096 #define CTREE_BLOCKSIZE 256
struct key { struct key {
u64 objectid; u64 objectid;
...@@ -22,18 +22,41 @@ struct header { ...@@ -22,18 +22,41 @@ struct header {
#define NODEPTRS_PER_BLOCK ((CTREE_BLOCKSIZE - sizeof(struct header)) / \ #define NODEPTRS_PER_BLOCK ((CTREE_BLOCKSIZE - sizeof(struct header)) / \
(sizeof(struct key) + sizeof(u64))) (sizeof(struct key) + sizeof(u64)))
#define LEVEL_BITS 3 #define MAX_LEVEL 8
#define MAX_LEVEL (1 << LEVEL_BITS)
#define node_level(f) ((f) & (MAX_LEVEL-1)) #define node_level(f) ((f) & (MAX_LEVEL-1))
#define is_leaf(f) (node_level(f) == 0) #define is_leaf(f) (node_level(f) == 0)
struct tree_buffer; struct tree_buffer;
/*
 * A contiguous run of blocks that tree blocks are handed out from.
 * get_free_block() returns blocknr + num_used and then bumps num_used;
 * the run is exhausted once num_used reaches num_blocks.
 */
struct alloc_extent {
/* block number of the first block in the run */
u64 blocknr;
/* total number of blocks in the run */
u64 num_blocks;
/* how many blocks of the run have already been handed out */
u64 num_used;
} __attribute__ ((__packed__));
struct ctree_root { struct ctree_root {
struct tree_buffer *node; struct tree_buffer *node;
struct ctree_root *extent_root;
struct alloc_extent *alloc_extent;
struct alloc_extent *reserve_extent;
int fp; int fp;
struct radix_tree_root cache_radix; struct radix_tree_root cache_radix;
struct alloc_extent ai1;
struct alloc_extent ai2;
}; };
/*
 * Per-tree description embedded in struct ctree_super_block.
 * __setup_root() reads tree_root, alloc_extent and reserve_extent from it
 * to initialise an in-memory struct ctree_root.
 * NOTE(review): csum and ham are not used anywhere in the visible code;
 * their meaning needs confirming.
 */
struct ctree_root_info {
u64 fsid[2]; /* FS specific uuid */
u64 blocknr; /* blocknr of this block */
u64 objectid; /* inode number of this root */
u64 tree_root; /* the tree root */
u32 csum;
u32 ham;
/* copied into ctree_root.ai1 and used as the active allocation run */
struct alloc_extent alloc_extent;
/* copied into ctree_root.ai2 and used as the reserve allocation run */
struct alloc_extent reserve_extent;
u64 snapuuid[2]; /* root specific uuid */
} __attribute__ ((__packed__));
struct item { struct item {
struct key key; struct key key;
u16 offset; u16 offset;
...@@ -55,6 +78,11 @@ struct node { ...@@ -55,6 +78,11 @@ struct node {
u64 blockptrs[NODEPTRS_PER_BLOCK]; u64 blockptrs[NODEPTRS_PER_BLOCK];
} __attribute__ ((__packed__)); } __attribute__ ((__packed__));
/*
 * Item payload that alloc_extent() inserts for each allocated extent.
 * The key of the item carries the range itself (objectid = first block,
 * offset = number of blocks).
 */
struct extent_item {
/* alloc_extent() sets this to 1 for a new extent */
u32 refs;
/* owner value passed in by the caller of alloc_extent() */
u64 owner;
} __attribute__ ((__packed__));
struct ctree_path { struct ctree_path {
struct tree_buffer *nodes[MAX_LEVEL]; struct tree_buffer *nodes[MAX_LEVEL];
int slots[MAX_LEVEL]; int slots[MAX_LEVEL];
......
...@@ -12,25 +12,27 @@ ...@@ -12,25 +12,27 @@
static int allocated_blocks = 0; static int allocated_blocks = 0;
struct ctree_header {
u64 root_block;
} __attribute__ ((__packed__));
static int get_free_block(struct ctree_root *root, u64 *block) static int get_free_block(struct ctree_root *root, u64 *block)
{ {
struct stat st; struct stat st;
int ret; int ret;
if (root->alloc_extent->num_used >= root->alloc_extent->num_blocks)
return -1;
*block = root->alloc_extent->blocknr + root->alloc_extent->num_used;
root->alloc_extent->num_used += 1;
if (root->alloc_extent->num_used >= root->alloc_extent->num_blocks) {
struct alloc_extent *ae = root->alloc_extent;
root->alloc_extent = root->reserve_extent;
root->reserve_extent = ae;
ae->num_blocks = 0;
}
st.st_size = 0; st.st_size = 0;
ret = fstat(root->fp, &st); ret = fstat(root->fp, &st);
if (st.st_size > sizeof(struct ctree_header)) { if (st.st_size < (*block + 1) * CTREE_BLOCKSIZE)
*block = (st.st_size - ret = ftruncate(root->fp,
sizeof(struct ctree_header)) / CTREE_BLOCKSIZE; (*block + 1) * CTREE_BLOCKSIZE);
} else {
*block = 0;
}
ret = ftruncate(root->fp, sizeof(struct ctree_header) + (*block + 1) *
CTREE_BLOCKSIZE);
return ret; return ret;
} }
...@@ -72,7 +74,7 @@ struct tree_buffer *alloc_free_block(struct ctree_root *root) ...@@ -72,7 +74,7 @@ struct tree_buffer *alloc_free_block(struct ctree_root *root)
struct tree_buffer *read_tree_block(struct ctree_root *root, u64 blocknr) struct tree_buffer *read_tree_block(struct ctree_root *root, u64 blocknr)
{ {
loff_t offset = blocknr * CTREE_BLOCKSIZE + sizeof(struct ctree_header); loff_t offset = blocknr * CTREE_BLOCKSIZE;
struct tree_buffer *buf; struct tree_buffer *buf;
int ret; int ret;
...@@ -101,7 +103,7 @@ struct tree_buffer *read_tree_block(struct ctree_root *root, u64 blocknr) ...@@ -101,7 +103,7 @@ struct tree_buffer *read_tree_block(struct ctree_root *root, u64 blocknr)
int write_tree_block(struct ctree_root *root, struct tree_buffer *buf) int write_tree_block(struct ctree_root *root, struct tree_buffer *buf)
{ {
u64 blocknr = buf->blocknr; u64 blocknr = buf->blocknr;
loff_t offset = blocknr * CTREE_BLOCKSIZE + sizeof(struct ctree_header); loff_t offset = blocknr * CTREE_BLOCKSIZE;
int ret; int ret;
if (buf->blocknr != buf->node.header.blocknr) if (buf->blocknr != buf->node.header.blocknr)
...@@ -114,11 +116,32 @@ int write_tree_block(struct ctree_root *root, struct tree_buffer *buf) ...@@ -114,11 +116,32 @@ int write_tree_block(struct ctree_root *root, struct tree_buffer *buf)
return 0; return 0;
} }
/*
 * Super block as read by open_ctree() with pread() at
 * CTREE_SUPER_INFO_OFFSET(CTREE_BLOCKSIZE).  It holds one root description
 * for each of the two trees that open_ctree() sets up.
 */
struct ctree_super_block {
/* describes the main tree (the root returned by open_ctree) */
struct ctree_root_info root_info;
/* describes the extent tree (root->extent_root) */
struct ctree_root_info extent_info;
} __attribute__ ((__packed__));
/*
 * Initialise an in-memory root from its on-disk description.
 *
 * root        - root to fill in (its previous contents are not relied on)
 * extent_root - root of the extent tree that tracks allocations for root
 * info        - on-disk description: tree root block and allocation runs
 * fp          - open file descriptor of the backing file
 *
 * The block cache and the allocation state are set up before the tree root
 * block is read, so read_tree_block() never sees a root whose cache_radix is
 * uninitialised.
 * NOTE(review): read_tree_block's body is not visible here; it is assumed to
 * consult root->cache_radix, as tree_block_release does.
 *
 * Always returns 0.
 */
static int __setup_root(struct ctree_root *root, struct ctree_root *extent_root,
			struct ctree_root_info *info, int fp)
{
	root->fp = fp;
	root->extent_root = extent_root;
	INIT_RADIX_TREE(&root->cache_radix, GFP_KERNEL);

	/* private copies of the on-disk allocation runs */
	memcpy(&root->ai1, &info->alloc_extent, sizeof(info->alloc_extent));
	memcpy(&root->ai2, &info->reserve_extent, sizeof(info->reserve_extent));
	root->alloc_extent = &root->ai1;
	root->reserve_extent = &root->ai2;

	root->node = read_tree_block(root, info->tree_root);
	printf("setup done reading root %p, used %lu\n", root, root->alloc_extent->num_used);
	return 0;
}
struct ctree_root *open_ctree(char *filename) struct ctree_root *open_ctree(char *filename)
{ {
struct ctree_root *root = malloc(sizeof(struct ctree_root)); struct ctree_root *root = malloc(sizeof(struct ctree_root));
struct ctree_root *extent_root = malloc(sizeof(struct ctree_root));
struct ctree_super_block super;
int fp; int fp;
u64 root_block;
int ret; int ret;
fp = open(filename, O_CREAT | O_RDWR); fp = open(filename, O_CREAT | O_RDWR);
...@@ -126,14 +149,20 @@ struct ctree_root *open_ctree(char *filename) ...@@ -126,14 +149,20 @@ struct ctree_root *open_ctree(char *filename)
free(root); free(root);
return NULL; return NULL;
} }
root->fp = fp; ret = pread(fp, &super, sizeof(struct ctree_super_block),
INIT_RADIX_TREE(&root->cache_radix, GFP_KERNEL); CTREE_SUPER_INFO_OFFSET(CTREE_BLOCKSIZE));
ret = pread(fp, &root_block, sizeof(u64), 0); if (ret == 0) {
if (ret == sizeof(u64)) { ret = mkfs(fp);
printf("reading root node at block %lu\n", root_block); if (ret)
root->node = read_tree_block(root, root_block); return NULL;
} else ret = pread(fp, &super, sizeof(struct ctree_super_block),
root->node = NULL; CTREE_SUPER_INFO_OFFSET(CTREE_BLOCKSIZE));
if (ret != sizeof(struct ctree_super_block))
return NULL;
}
BUG_ON(ret < 0);
__setup_root(root, extent_root, &super.root_info, fp);
__setup_root(extent_root, extent_root, &super.extent_info, fp);
return root; return root;
} }
...@@ -160,6 +189,7 @@ int update_root_block(struct ctree_root *root) ...@@ -160,6 +189,7 @@ int update_root_block(struct ctree_root *root)
void tree_block_release(struct ctree_root *root, struct tree_buffer *buf) void tree_block_release(struct ctree_root *root, struct tree_buffer *buf)
{ {
return;
buf->count--; buf->count--;
if (buf->count == 0) { if (buf->count == 0) {
if (!radix_tree_lookup(&root->cache_radix, buf->blocknr)) if (!radix_tree_lookup(&root->cache_radix, buf->blocknr))
......
...@@ -17,5 +17,8 @@ int close_ctree(struct ctree_root *root); ...@@ -17,5 +17,8 @@ int close_ctree(struct ctree_root *root);
void tree_block_release(struct ctree_root *root, struct tree_buffer *buf); void tree_block_release(struct ctree_root *root, struct tree_buffer *buf);
struct tree_buffer *alloc_free_block(struct ctree_root *root); struct tree_buffer *alloc_free_block(struct ctree_root *root);
int update_root_block(struct ctree_root *root); int update_root_block(struct ctree_root *root);
int mkfs(int fd);
#define CTREE_SUPER_INFO_OFFSET(bs) (16 * (bs))
#endif #endif
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment