blob: 30c9365861e69602f96e4debc96bacf8889028e1 [file] [log] [blame]
Chris Masond1310b22008-01-24 16:13:08 -05001#include <linux/err.h>
Chris Masona52d9a82007-08-27 16:49:44 -04002#include <linux/gfp.h>
Chris Masond1310b22008-01-24 16:13:08 -05003#include <linux/slab.h>
Chris Masona52d9a82007-08-27 16:49:44 -04004#include <linux/module.h>
5#include <linux/spinlock.h>
Chris Masond1310b22008-01-24 16:13:08 -05006#include <linux/hardirq.h>
Chris Masona52d9a82007-08-27 16:49:44 -04007#include "extent_map.h"
8
Chris Mason86479a02007-09-10 19:58:16 -04009
/*
 * Slab cache backing every struct extent_map allocation in this file.
 * Set up by extent_map_init() and torn down by extent_map_exit().
 */
static struct kmem_cache *extent_map_cache;
Chris Masonca664622007-11-27 11:16:35 -050011
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050012int __init extent_map_init(void)
Chris Masona52d9a82007-08-27 16:49:44 -040013{
Christoph Hellwig9601e3f2009-04-13 15:33:09 +020014 extent_map_cache = kmem_cache_create("extent_map",
15 sizeof(struct extent_map), 0,
16 SLAB_RECLAIM_ACCOUNT | SLAB_MEM_SPREAD, NULL);
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050017 if (!extent_map_cache)
18 return -ENOMEM;
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050019 return 0;
Chris Masona52d9a82007-08-27 16:49:44 -040020}
21
Christian Hesse17636e02007-12-11 09:25:06 -050022void extent_map_exit(void)
Chris Masona52d9a82007-08-27 16:49:44 -040023{
Chris Masona52d9a82007-08-27 16:49:44 -040024 if (extent_map_cache)
25 kmem_cache_destroy(extent_map_cache);
Chris Masona52d9a82007-08-27 16:49:44 -040026}
27
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040028/**
29 * extent_map_tree_init - initialize extent map tree
30 * @tree: tree to initialize
31 * @mask: flags for memory allocations during tree operations
32 *
33 * Initialize the extent tree @tree. Should be called for each new inode
34 * or other user of the extent_map interface.
35 */
Chris Masond1310b22008-01-24 16:13:08 -050036void extent_map_tree_init(struct extent_map_tree *tree, gfp_t mask)
Chris Masona52d9a82007-08-27 16:49:44 -040037{
38 tree->map.rb_node = NULL;
Chris Masond1310b22008-01-24 16:13:08 -050039 spin_lock_init(&tree->lock);
Chris Masona52d9a82007-08-27 16:49:44 -040040}
Chris Masona52d9a82007-08-27 16:49:44 -040041
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040042/**
43 * alloc_extent_map - allocate new extent map structure
44 * @mask: memory allocation flags
45 *
46 * Allocate a new extent_map structure. The new structure is
47 * returned with a reference count of one and needs to be
48 * freed using free_extent_map()
49 */
Chris Masona52d9a82007-08-27 16:49:44 -040050struct extent_map *alloc_extent_map(gfp_t mask)
51{
52 struct extent_map *em;
53 em = kmem_cache_alloc(extent_map_cache, mask);
54 if (!em || IS_ERR(em))
55 return em;
56 em->in_tree = 0;
Chris Masond1310b22008-01-24 16:13:08 -050057 em->flags = 0;
Chris Masona52d9a82007-08-27 16:49:44 -040058 atomic_set(&em->refs, 1);
59 return em;
60}
Chris Masona52d9a82007-08-27 16:49:44 -040061
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040062/**
63 * free_extent_map - drop reference count of an extent_map
64 * @em: extent map beeing releasead
65 *
66 * Drops the reference out on @em by one and free the structure
67 * if the reference count hits zero.
68 */
Chris Masona52d9a82007-08-27 16:49:44 -040069void free_extent_map(struct extent_map *em)
70{
Chris Mason2bf5a722007-08-30 11:54:02 -040071 if (!em)
72 return;
Chris Masond1310b22008-01-24 16:13:08 -050073 WARN_ON(atomic_read(&em->refs) == 0);
Chris Masona52d9a82007-08-27 16:49:44 -040074 if (atomic_dec_and_test(&em->refs)) {
75 WARN_ON(em->in_tree);
76 kmem_cache_free(extent_map_cache, em);
77 }
78}
Chris Masona52d9a82007-08-27 16:49:44 -040079
Chris Masona52d9a82007-08-27 16:49:44 -040080static struct rb_node *tree_insert(struct rb_root *root, u64 offset,
81 struct rb_node *node)
82{
Chris Masond3977122009-01-05 21:25:51 -050083 struct rb_node **p = &root->rb_node;
84 struct rb_node *parent = NULL;
Chris Masond1310b22008-01-24 16:13:08 -050085 struct extent_map *entry;
Chris Masona52d9a82007-08-27 16:49:44 -040086
Chris Masond3977122009-01-05 21:25:51 -050087 while (*p) {
Chris Masona52d9a82007-08-27 16:49:44 -040088 parent = *p;
Chris Masond1310b22008-01-24 16:13:08 -050089 entry = rb_entry(parent, struct extent_map, rb_node);
90
91 WARN_ON(!entry->in_tree);
Chris Masona52d9a82007-08-27 16:49:44 -040092
93 if (offset < entry->start)
94 p = &(*p)->rb_left;
Chris Masond1310b22008-01-24 16:13:08 -050095 else if (offset >= extent_map_end(entry))
Chris Masona52d9a82007-08-27 16:49:44 -040096 p = &(*p)->rb_right;
97 else
98 return parent;
99 }
100
Chris Masond1310b22008-01-24 16:13:08 -0500101 entry = rb_entry(node, struct extent_map, rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400102 entry->in_tree = 1;
103 rb_link_node(node, parent, p);
104 rb_insert_color(node, root);
105 return NULL;
106}
107
Chris Masond352ac62008-09-29 15:18:18 -0400108/*
109 * search through the tree for an extent_map with a given offset. If
110 * it can't be found, try to find some neighboring extents
111 */
Chris Masona52d9a82007-08-27 16:49:44 -0400112static struct rb_node *__tree_search(struct rb_root *root, u64 offset,
Chris Mason5f564062008-01-22 16:47:59 -0500113 struct rb_node **prev_ret,
114 struct rb_node **next_ret)
Chris Masona52d9a82007-08-27 16:49:44 -0400115{
Chris Masond3977122009-01-05 21:25:51 -0500116 struct rb_node *n = root->rb_node;
Chris Masona52d9a82007-08-27 16:49:44 -0400117 struct rb_node *prev = NULL;
Chris Mason5f564062008-01-22 16:47:59 -0500118 struct rb_node *orig_prev = NULL;
Chris Masond1310b22008-01-24 16:13:08 -0500119 struct extent_map *entry;
120 struct extent_map *prev_entry = NULL;
Chris Masona52d9a82007-08-27 16:49:44 -0400121
Chris Masond3977122009-01-05 21:25:51 -0500122 while (n) {
Chris Masond1310b22008-01-24 16:13:08 -0500123 entry = rb_entry(n, struct extent_map, rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400124 prev = n;
125 prev_entry = entry;
126
Chris Masond1310b22008-01-24 16:13:08 -0500127 WARN_ON(!entry->in_tree);
128
Chris Masona52d9a82007-08-27 16:49:44 -0400129 if (offset < entry->start)
130 n = n->rb_left;
Chris Masond1310b22008-01-24 16:13:08 -0500131 else if (offset >= extent_map_end(entry))
Chris Masona52d9a82007-08-27 16:49:44 -0400132 n = n->rb_right;
133 else
134 return n;
135 }
Chris Mason5f564062008-01-22 16:47:59 -0500136
137 if (prev_ret) {
138 orig_prev = prev;
Chris Masond3977122009-01-05 21:25:51 -0500139 while (prev && offset >= extent_map_end(prev_entry)) {
Chris Mason5f564062008-01-22 16:47:59 -0500140 prev = rb_next(prev);
Chris Masond1310b22008-01-24 16:13:08 -0500141 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Mason5f564062008-01-22 16:47:59 -0500142 }
143 *prev_ret = prev;
144 prev = orig_prev;
Chris Masona52d9a82007-08-27 16:49:44 -0400145 }
Chris Mason5f564062008-01-22 16:47:59 -0500146
147 if (next_ret) {
Chris Masond1310b22008-01-24 16:13:08 -0500148 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Masond3977122009-01-05 21:25:51 -0500149 while (prev && offset < prev_entry->start) {
Chris Mason5f564062008-01-22 16:47:59 -0500150 prev = rb_prev(prev);
Chris Masond1310b22008-01-24 16:13:08 -0500151 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Mason5f564062008-01-22 16:47:59 -0500152 }
153 *next_ret = prev;
154 }
Chris Masona52d9a82007-08-27 16:49:44 -0400155 return NULL;
156}
157
Chris Masond352ac62008-09-29 15:18:18 -0400158/*
159 * look for an offset in the tree, and if it can't be found, return
160 * the first offset we can find smaller than 'offset'.
161 */
Chris Masona52d9a82007-08-27 16:49:44 -0400162static inline struct rb_node *tree_search(struct rb_root *root, u64 offset)
163{
164 struct rb_node *prev;
165 struct rb_node *ret;
Chris Mason5f564062008-01-22 16:47:59 -0500166 ret = __tree_search(root, offset, &prev, NULL);
Chris Masona52d9a82007-08-27 16:49:44 -0400167 if (!ret)
168 return prev;
169 return ret;
170}
171
Chris Masond352ac62008-09-29 15:18:18 -0400172/* check to see if two extent_map structs are adjacent and safe to merge */
Chris Masond1310b22008-01-24 16:13:08 -0500173static int mergable_maps(struct extent_map *prev, struct extent_map *next)
Chris Masona52d9a82007-08-27 16:49:44 -0400174{
Chris Mason7f3c74f2008-07-18 12:01:11 -0400175 if (test_bit(EXTENT_FLAG_PINNED, &prev->flags))
176 return 0;
177
Chris Masonc8b97812008-10-29 14:49:59 -0400178 /*
179 * don't merge compressed extents, we need to know their
180 * actual size
181 */
182 if (test_bit(EXTENT_FLAG_COMPRESSED, &prev->flags))
183 return 0;
184
Chris Masond1310b22008-01-24 16:13:08 -0500185 if (extent_map_end(prev) == next->start &&
186 prev->flags == next->flags &&
187 prev->bdev == next->bdev &&
188 ((next->block_start == EXTENT_MAP_HOLE &&
189 prev->block_start == EXTENT_MAP_HOLE) ||
190 (next->block_start == EXTENT_MAP_INLINE &&
191 prev->block_start == EXTENT_MAP_INLINE) ||
192 (next->block_start == EXTENT_MAP_DELALLOC &&
193 prev->block_start == EXTENT_MAP_DELALLOC) ||
194 (next->block_start < EXTENT_MAP_LAST_BYTE - 1 &&
195 next->block_start == extent_map_block_end(prev)))) {
196 return 1;
197 }
Chris Masona52d9a82007-08-27 16:49:44 -0400198 return 0;
199}
200
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400201/**
202 * add_extent_mapping - add new extent map to the extent tree
203 * @tree: tree to insert new map in
204 * @em: map to insert
205 *
206 * Insert @em into @tree or perform a simple forward/backward merge with
207 * existing mappings. The extent_map struct passed in will be inserted
208 * into the tree directly, with an additional reference taken, or a
209 * reference dropped if the merge attempt was sucessfull.
Chris Masona52d9a82007-08-27 16:49:44 -0400210 */
211int add_extent_mapping(struct extent_map_tree *tree,
212 struct extent_map *em)
213{
214 int ret = 0;
Chris Masond1310b22008-01-24 16:13:08 -0500215 struct extent_map *merge = NULL;
Chris Masona52d9a82007-08-27 16:49:44 -0400216 struct rb_node *rb;
Chris Mason7c2fe322008-08-20 08:51:50 -0400217 struct extent_map *exist;
Chris Masona52d9a82007-08-27 16:49:44 -0400218
Chris Mason7c2fe322008-08-20 08:51:50 -0400219 exist = lookup_extent_mapping(tree, em->start, em->len);
220 if (exist) {
221 free_extent_map(exist);
222 ret = -EEXIST;
223 goto out;
224 }
David Woodhouse64f26f72008-07-24 10:09:43 -0400225 assert_spin_locked(&tree->lock);
Chris Masond1310b22008-01-24 16:13:08 -0500226 rb = tree_insert(&tree->map, em->start, &em->rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400227 if (rb) {
Chris Masona52d9a82007-08-27 16:49:44 -0400228 ret = -EEXIST;
229 goto out;
230 }
231 atomic_inc(&em->refs);
232 if (em->start != 0) {
233 rb = rb_prev(&em->rb_node);
234 if (rb)
Chris Masond1310b22008-01-24 16:13:08 -0500235 merge = rb_entry(rb, struct extent_map, rb_node);
236 if (rb && mergable_maps(merge, em)) {
237 em->start = merge->start;
238 em->len += merge->len;
Chris Masonc8b97812008-10-29 14:49:59 -0400239 em->block_len += merge->block_len;
Chris Masond1310b22008-01-24 16:13:08 -0500240 em->block_start = merge->block_start;
241 merge->in_tree = 0;
242 rb_erase(&merge->rb_node, &tree->map);
243 free_extent_map(merge);
Chris Masona52d9a82007-08-27 16:49:44 -0400244 }
245 }
Chris Masond1310b22008-01-24 16:13:08 -0500246 rb = rb_next(&em->rb_node);
247 if (rb)
248 merge = rb_entry(rb, struct extent_map, rb_node);
249 if (rb && mergable_maps(em, merge)) {
250 em->len += merge->len;
Chris Masonc8b97812008-10-29 14:49:59 -0400251 em->block_len += merge->len;
Chris Masond1310b22008-01-24 16:13:08 -0500252 rb_erase(&merge->rb_node, &tree->map);
253 merge->in_tree = 0;
254 free_extent_map(merge);
255 }
Chris Masona52d9a82007-08-27 16:49:44 -0400256out:
Chris Masona52d9a82007-08-27 16:49:44 -0400257 return ret;
258}
Chris Masona52d9a82007-08-27 16:49:44 -0400259
/*
 * Compute the end offset of the range starting at 'start' and spanning
 * 'len' bytes.  If the sum wraps around, the end is clamped to the
 * largest u64 value.
 */
static u64 range_end(u64 start, u64 len)
{
	u64 end = start + len;

	return end < start ? (u64)-1 : end;
}
267
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400268/**
269 * lookup_extent_mapping - lookup extent_map
270 * @tree: tree to lookup in
271 * @start: byte offset to start the search
272 * @len: length of the lookup range
273 *
274 * Find and return the first extent_map struct in @tree that intersects the
275 * [start, len] range. There may be additional objects in the tree that
276 * intersect, so check the object returned carefully to make sure that no
277 * additional lookups are needed.
Chris Masona52d9a82007-08-27 16:49:44 -0400278 */
279struct extent_map *lookup_extent_mapping(struct extent_map_tree *tree,
Chris Masond1310b22008-01-24 16:13:08 -0500280 u64 start, u64 len)
Chris Masona52d9a82007-08-27 16:49:44 -0400281{
282 struct extent_map *em;
283 struct rb_node *rb_node;
Christoph Hellwig306929f2008-06-10 10:21:04 -0400284 struct rb_node *prev = NULL;
285 struct rb_node *next = NULL;
286 u64 end = range_end(start, len);
287
David Woodhouse64f26f72008-07-24 10:09:43 -0400288 assert_spin_locked(&tree->lock);
Chris Mason5f564062008-01-22 16:47:59 -0500289 rb_node = __tree_search(&tree->map, start, &prev, &next);
290 if (!rb_node && prev) {
291 em = rb_entry(prev, struct extent_map, rb_node);
Chris Masond1310b22008-01-24 16:13:08 -0500292 if (end > em->start && start < extent_map_end(em))
Chris Mason5f564062008-01-22 16:47:59 -0500293 goto found;
294 }
295 if (!rb_node && next) {
296 em = rb_entry(next, struct extent_map, rb_node);
Chris Masond1310b22008-01-24 16:13:08 -0500297 if (end > em->start && start < extent_map_end(em))
Chris Mason5f564062008-01-22 16:47:59 -0500298 goto found;
299 }
Chris Masona52d9a82007-08-27 16:49:44 -0400300 if (!rb_node) {
301 em = NULL;
302 goto out;
303 }
304 if (IS_ERR(rb_node)) {
305 em = ERR_PTR(PTR_ERR(rb_node));
306 goto out;
307 }
308 em = rb_entry(rb_node, struct extent_map, rb_node);
Chris Masond1310b22008-01-24 16:13:08 -0500309 if (end > em->start && start < extent_map_end(em))
310 goto found;
311
312 em = NULL;
313 goto out;
314
Chris Mason5f564062008-01-22 16:47:59 -0500315found:
Chris Masona52d9a82007-08-27 16:49:44 -0400316 atomic_inc(&em->refs);
317out:
Chris Masona52d9a82007-08-27 16:49:44 -0400318 return em;
319}
Chris Masona52d9a82007-08-27 16:49:44 -0400320
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400321/**
322 * remove_extent_mapping - removes an extent_map from the extent tree
323 * @tree: extent tree to remove from
324 * @em: extent map beeing removed
325 *
326 * Removes @em from @tree. No reference counts are dropped, and no checks
327 * are done to see if the range is in use
Chris Masona52d9a82007-08-27 16:49:44 -0400328 */
329int remove_extent_mapping(struct extent_map_tree *tree, struct extent_map *em)
330{
Chris Masond1310b22008-01-24 16:13:08 -0500331 int ret = 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400332
Chris Mason7f3c74f2008-07-18 12:01:11 -0400333 WARN_ON(test_bit(EXTENT_FLAG_PINNED, &em->flags));
David Woodhouse64f26f72008-07-24 10:09:43 -0400334 assert_spin_locked(&tree->lock);
Chris Masond1310b22008-01-24 16:13:08 -0500335 rb_erase(&em->rb_node, &tree->map);
336 em->in_tree = 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400337 return ret;
338}