d1310b2e0c
There is now extent_map for mapping offsets in the file to disk and extent_io for state tracking, IO submission and extent_bufers. The new extent_map code shifts from [start,end] pairs to [start,len], and pushes the locking out into the caller. This allows a few performance optimizations and is easier to use. A number of extent_map usage bugs were fixed, mostly with failing to remove extent_map entries when changing the file. Signed-off-by: Chris Mason <chris.mason@oracle.com>
285 lines
6.9 KiB
C
285 lines
6.9 KiB
C
#include <linux/err.h>
|
|
#include <linux/gfp.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/module.h>
|
|
#include <linux/spinlock.h>
|
|
#include <linux/version.h>
|
|
#include <linux/hardirq.h>
|
|
#include "extent_map.h"
|
|
|
|
/* temporary define until extent_map moves out of btrfs */
|
|
struct kmem_cache *btrfs_cache_create(const char *name, size_t size,
|
|
unsigned long extra_flags,
|
|
void (*ctor)(void *, struct kmem_cache *,
|
|
unsigned long));
|
|
|
|
static struct kmem_cache *extent_map_cache;
|
|
|
|
int __init extent_map_init(void)
|
|
{
|
|
extent_map_cache = btrfs_cache_create("extent_map",
|
|
sizeof(struct extent_map), 0,
|
|
NULL);
|
|
if (!extent_map_cache)
|
|
return -ENOMEM;
|
|
return 0;
|
|
}
|
|
|
|
void extent_map_exit(void)
|
|
{
|
|
if (extent_map_cache)
|
|
kmem_cache_destroy(extent_map_cache);
|
|
}
|
|
|
|
void extent_map_tree_init(struct extent_map_tree *tree, gfp_t mask)
|
|
{
|
|
tree->map.rb_node = NULL;
|
|
tree->last = NULL;
|
|
spin_lock_init(&tree->lock);
|
|
}
|
|
EXPORT_SYMBOL(extent_map_tree_init);
|
|
|
|
struct extent_map *alloc_extent_map(gfp_t mask)
|
|
{
|
|
struct extent_map *em;
|
|
em = kmem_cache_alloc(extent_map_cache, mask);
|
|
if (!em || IS_ERR(em))
|
|
return em;
|
|
em->in_tree = 0;
|
|
em->flags = 0;
|
|
atomic_set(&em->refs, 1);
|
|
return em;
|
|
}
|
|
EXPORT_SYMBOL(alloc_extent_map);
|
|
|
|
void free_extent_map(struct extent_map *em)
|
|
{
|
|
if (!em)
|
|
return;
|
|
WARN_ON(atomic_read(&em->refs) == 0);
|
|
if (atomic_dec_and_test(&em->refs)) {
|
|
WARN_ON(em->in_tree);
|
|
kmem_cache_free(extent_map_cache, em);
|
|
}
|
|
}
|
|
EXPORT_SYMBOL(free_extent_map);
|
|
|
|
static struct rb_node *tree_insert(struct rb_root *root, u64 offset,
|
|
struct rb_node *node)
|
|
{
|
|
struct rb_node ** p = &root->rb_node;
|
|
struct rb_node * parent = NULL;
|
|
struct extent_map *entry;
|
|
|
|
while(*p) {
|
|
parent = *p;
|
|
entry = rb_entry(parent, struct extent_map, rb_node);
|
|
|
|
WARN_ON(!entry->in_tree);
|
|
|
|
if (offset < entry->start)
|
|
p = &(*p)->rb_left;
|
|
else if (offset >= extent_map_end(entry))
|
|
p = &(*p)->rb_right;
|
|
else
|
|
return parent;
|
|
}
|
|
|
|
entry = rb_entry(node, struct extent_map, rb_node);
|
|
entry->in_tree = 1;
|
|
rb_link_node(node, parent, p);
|
|
rb_insert_color(node, root);
|
|
return NULL;
|
|
}
|
|
|
|
static struct rb_node *__tree_search(struct rb_root *root, u64 offset,
|
|
struct rb_node **prev_ret,
|
|
struct rb_node **next_ret)
|
|
{
|
|
struct rb_node * n = root->rb_node;
|
|
struct rb_node *prev = NULL;
|
|
struct rb_node *orig_prev = NULL;
|
|
struct extent_map *entry;
|
|
struct extent_map *prev_entry = NULL;
|
|
|
|
while(n) {
|
|
entry = rb_entry(n, struct extent_map, rb_node);
|
|
prev = n;
|
|
prev_entry = entry;
|
|
|
|
WARN_ON(!entry->in_tree);
|
|
|
|
if (offset < entry->start)
|
|
n = n->rb_left;
|
|
else if (offset >= extent_map_end(entry))
|
|
n = n->rb_right;
|
|
else
|
|
return n;
|
|
}
|
|
|
|
if (prev_ret) {
|
|
orig_prev = prev;
|
|
while(prev && offset >= extent_map_end(prev_entry)) {
|
|
prev = rb_next(prev);
|
|
prev_entry = rb_entry(prev, struct extent_map, rb_node);
|
|
}
|
|
*prev_ret = prev;
|
|
prev = orig_prev;
|
|
}
|
|
|
|
if (next_ret) {
|
|
prev_entry = rb_entry(prev, struct extent_map, rb_node);
|
|
while(prev && offset < prev_entry->start) {
|
|
prev = rb_prev(prev);
|
|
prev_entry = rb_entry(prev, struct extent_map, rb_node);
|
|
}
|
|
*next_ret = prev;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
static inline struct rb_node *tree_search(struct rb_root *root, u64 offset)
|
|
{
|
|
struct rb_node *prev;
|
|
struct rb_node *ret;
|
|
ret = __tree_search(root, offset, &prev, NULL);
|
|
if (!ret)
|
|
return prev;
|
|
return ret;
|
|
}
|
|
|
|
static int mergable_maps(struct extent_map *prev, struct extent_map *next)
|
|
{
|
|
if (extent_map_end(prev) == next->start &&
|
|
prev->flags == next->flags &&
|
|
prev->bdev == next->bdev &&
|
|
((next->block_start == EXTENT_MAP_HOLE &&
|
|
prev->block_start == EXTENT_MAP_HOLE) ||
|
|
(next->block_start == EXTENT_MAP_INLINE &&
|
|
prev->block_start == EXTENT_MAP_INLINE) ||
|
|
(next->block_start == EXTENT_MAP_DELALLOC &&
|
|
prev->block_start == EXTENT_MAP_DELALLOC) ||
|
|
(next->block_start < EXTENT_MAP_LAST_BYTE - 1 &&
|
|
next->block_start == extent_map_block_end(prev)))) {
|
|
return 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/*
|
|
* add_extent_mapping tries a simple forward/backward merge with existing
|
|
* mappings. The extent_map struct passed in will be inserted into
|
|
* the tree directly (no copies made, just a reference taken).
|
|
*/
|
|
int add_extent_mapping(struct extent_map_tree *tree,
|
|
struct extent_map *em)
|
|
{
|
|
int ret = 0;
|
|
struct extent_map *merge = NULL;
|
|
struct rb_node *rb;
|
|
|
|
rb = tree_insert(&tree->map, em->start, &em->rb_node);
|
|
if (rb) {
|
|
merge = rb_entry(rb, struct extent_map, rb_node);
|
|
ret = -EEXIST;
|
|
goto out;
|
|
}
|
|
atomic_inc(&em->refs);
|
|
if (em->start != 0) {
|
|
rb = rb_prev(&em->rb_node);
|
|
if (rb)
|
|
merge = rb_entry(rb, struct extent_map, rb_node);
|
|
if (rb && mergable_maps(merge, em)) {
|
|
em->start = merge->start;
|
|
em->len += merge->len;
|
|
em->block_start = merge->block_start;
|
|
merge->in_tree = 0;
|
|
rb_erase(&merge->rb_node, &tree->map);
|
|
free_extent_map(merge);
|
|
}
|
|
}
|
|
rb = rb_next(&em->rb_node);
|
|
if (rb)
|
|
merge = rb_entry(rb, struct extent_map, rb_node);
|
|
if (rb && mergable_maps(em, merge)) {
|
|
em->len += merge->len;
|
|
rb_erase(&merge->rb_node, &tree->map);
|
|
merge->in_tree = 0;
|
|
free_extent_map(merge);
|
|
}
|
|
tree->last = em;
|
|
out:
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL(add_extent_mapping);
|
|
|
|
static u64 range_end(u64 start, u64 len)
|
|
{
|
|
if (start + len < start)
|
|
return (u64)-1;
|
|
return start + len;
|
|
}
|
|
|
|
/*
|
|
* lookup_extent_mapping returns the first extent_map struct in the
|
|
* tree that intersects the [start, len] range. There may
|
|
* be additional objects in the tree that intersect, so check the object
|
|
* returned carefully to make sure you don't need additional lookups.
|
|
*/
|
|
struct extent_map *lookup_extent_mapping(struct extent_map_tree *tree,
|
|
u64 start, u64 len)
|
|
{
|
|
struct extent_map *em;
|
|
struct rb_node *rb_node;
|
|
struct rb_node *prev = NULL; struct rb_node *next = NULL; u64 end = range_end(start, len); em = tree->last; if (em && end > em->start && start < extent_map_end(em)) goto found;
|
|
|
|
rb_node = __tree_search(&tree->map, start, &prev, &next);
|
|
if (!rb_node && prev) {
|
|
em = rb_entry(prev, struct extent_map, rb_node);
|
|
if (end > em->start && start < extent_map_end(em))
|
|
goto found;
|
|
}
|
|
if (!rb_node && next) {
|
|
em = rb_entry(next, struct extent_map, rb_node);
|
|
if (end > em->start && start < extent_map_end(em))
|
|
goto found;
|
|
}
|
|
if (!rb_node) {
|
|
em = NULL;
|
|
goto out;
|
|
}
|
|
if (IS_ERR(rb_node)) {
|
|
em = ERR_PTR(PTR_ERR(rb_node));
|
|
goto out;
|
|
}
|
|
em = rb_entry(rb_node, struct extent_map, rb_node);
|
|
if (end > em->start && start < extent_map_end(em))
|
|
goto found;
|
|
|
|
em = NULL;
|
|
goto out;
|
|
|
|
found:
|
|
atomic_inc(&em->refs);
|
|
tree->last = em;
|
|
out:
|
|
return em;
|
|
}
|
|
EXPORT_SYMBOL(lookup_extent_mapping);
|
|
|
|
/*
|
|
* removes an extent_map struct from the tree. No reference counts are
|
|
* dropped, and no checks are done to see if the range is in use
|
|
*/
|
|
int remove_extent_mapping(struct extent_map_tree *tree, struct extent_map *em)
|
|
{
|
|
int ret = 0;
|
|
|
|
rb_erase(&em->rb_node, &tree->map);
|
|
em->in_tree = 0;
|
|
if (tree->last == em)
|
|
tree->last = NULL;
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL(remove_extent_mapping);
|