blob: 454ca52d6451b649b78b48cba908f3fd1eb2bada [file] [log] [blame]
Chris Masond1310b22008-01-24 16:13:08 -05001#include <linux/err.h>
Chris Masond1310b22008-01-24 16:13:08 -05002#include <linux/slab.h>
Chris Masona52d9a82007-08-27 16:49:44 -04003#include <linux/module.h>
4#include <linux/spinlock.h>
Chris Masond1310b22008-01-24 16:13:08 -05005#include <linux/hardirq.h>
Chris Masona52d9a82007-08-27 16:49:44 -04006#include "extent_map.h"
7
Chris Mason86479a02007-09-10 19:58:16 -04008
Chris Masona52d9a82007-08-27 16:49:44 -04009static struct kmem_cache *extent_map_cache;
Chris Masonca664622007-11-27 11:16:35 -050010
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050011int __init extent_map_init(void)
Chris Masona52d9a82007-08-27 16:49:44 -040012{
Christoph Hellwig9601e3f2009-04-13 15:33:09 +020013 extent_map_cache = kmem_cache_create("extent_map",
14 sizeof(struct extent_map), 0,
15 SLAB_RECLAIM_ACCOUNT | SLAB_MEM_SPREAD, NULL);
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050016 if (!extent_map_cache)
17 return -ENOMEM;
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050018 return 0;
Chris Masona52d9a82007-08-27 16:49:44 -040019}
20
Christian Hesse17636e02007-12-11 09:25:06 -050021void extent_map_exit(void)
Chris Masona52d9a82007-08-27 16:49:44 -040022{
Chris Masona52d9a82007-08-27 16:49:44 -040023 if (extent_map_cache)
24 kmem_cache_destroy(extent_map_cache);
Chris Masona52d9a82007-08-27 16:49:44 -040025}
26
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040027/**
28 * extent_map_tree_init - initialize extent map tree
29 * @tree: tree to initialize
30 * @mask: flags for memory allocations during tree operations
31 *
32 * Initialize the extent tree @tree. Should be called for each new inode
33 * or other user of the extent_map interface.
34 */
Chris Masond1310b22008-01-24 16:13:08 -050035void extent_map_tree_init(struct extent_map_tree *tree, gfp_t mask)
Chris Masona52d9a82007-08-27 16:49:44 -040036{
Eric Paris6bef4d32010-02-23 19:43:04 +000037 tree->map = RB_ROOT;
Chris Mason890871b2009-09-02 16:24:52 -040038 rwlock_init(&tree->lock);
Chris Masona52d9a82007-08-27 16:49:44 -040039}
Chris Masona52d9a82007-08-27 16:49:44 -040040
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040041/**
42 * alloc_extent_map - allocate new extent map structure
43 * @mask: memory allocation flags
44 *
45 * Allocate a new extent_map structure. The new structure is
46 * returned with a reference count of one and needs to be
47 * freed using free_extent_map()
48 */
Chris Masona52d9a82007-08-27 16:49:44 -040049struct extent_map *alloc_extent_map(gfp_t mask)
50{
51 struct extent_map *em;
52 em = kmem_cache_alloc(extent_map_cache, mask);
53 if (!em || IS_ERR(em))
54 return em;
55 em->in_tree = 0;
Chris Masond1310b22008-01-24 16:13:08 -050056 em->flags = 0;
Chris Masona52d9a82007-08-27 16:49:44 -040057 atomic_set(&em->refs, 1);
58 return em;
59}
Chris Masona52d9a82007-08-27 16:49:44 -040060
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040061/**
62 * free_extent_map - drop reference count of an extent_map
63 * @em: extent map beeing releasead
64 *
65 * Drops the reference out on @em by one and free the structure
66 * if the reference count hits zero.
67 */
Chris Masona52d9a82007-08-27 16:49:44 -040068void free_extent_map(struct extent_map *em)
69{
Chris Mason2bf5a722007-08-30 11:54:02 -040070 if (!em)
71 return;
Chris Masond1310b22008-01-24 16:13:08 -050072 WARN_ON(atomic_read(&em->refs) == 0);
Chris Masona52d9a82007-08-27 16:49:44 -040073 if (atomic_dec_and_test(&em->refs)) {
74 WARN_ON(em->in_tree);
75 kmem_cache_free(extent_map_cache, em);
76 }
77}
Chris Masona52d9a82007-08-27 16:49:44 -040078
Chris Masona52d9a82007-08-27 16:49:44 -040079static struct rb_node *tree_insert(struct rb_root *root, u64 offset,
80 struct rb_node *node)
81{
Chris Masond3977122009-01-05 21:25:51 -050082 struct rb_node **p = &root->rb_node;
83 struct rb_node *parent = NULL;
Chris Masond1310b22008-01-24 16:13:08 -050084 struct extent_map *entry;
Chris Masona52d9a82007-08-27 16:49:44 -040085
Chris Masond3977122009-01-05 21:25:51 -050086 while (*p) {
Chris Masona52d9a82007-08-27 16:49:44 -040087 parent = *p;
Chris Masond1310b22008-01-24 16:13:08 -050088 entry = rb_entry(parent, struct extent_map, rb_node);
89
90 WARN_ON(!entry->in_tree);
Chris Masona52d9a82007-08-27 16:49:44 -040091
92 if (offset < entry->start)
93 p = &(*p)->rb_left;
Chris Masond1310b22008-01-24 16:13:08 -050094 else if (offset >= extent_map_end(entry))
Chris Masona52d9a82007-08-27 16:49:44 -040095 p = &(*p)->rb_right;
96 else
97 return parent;
98 }
99
Chris Masond1310b22008-01-24 16:13:08 -0500100 entry = rb_entry(node, struct extent_map, rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400101 entry->in_tree = 1;
102 rb_link_node(node, parent, p);
103 rb_insert_color(node, root);
104 return NULL;
105}
106
Chris Masond352ac62008-09-29 15:18:18 -0400107/*
108 * search through the tree for an extent_map with a given offset. If
109 * it can't be found, try to find some neighboring extents
110 */
Chris Masona52d9a82007-08-27 16:49:44 -0400111static struct rb_node *__tree_search(struct rb_root *root, u64 offset,
Chris Mason5f564062008-01-22 16:47:59 -0500112 struct rb_node **prev_ret,
113 struct rb_node **next_ret)
Chris Masona52d9a82007-08-27 16:49:44 -0400114{
Chris Masond3977122009-01-05 21:25:51 -0500115 struct rb_node *n = root->rb_node;
Chris Masona52d9a82007-08-27 16:49:44 -0400116 struct rb_node *prev = NULL;
Chris Mason5f564062008-01-22 16:47:59 -0500117 struct rb_node *orig_prev = NULL;
Chris Masond1310b22008-01-24 16:13:08 -0500118 struct extent_map *entry;
119 struct extent_map *prev_entry = NULL;
Chris Masona52d9a82007-08-27 16:49:44 -0400120
Chris Masond3977122009-01-05 21:25:51 -0500121 while (n) {
Chris Masond1310b22008-01-24 16:13:08 -0500122 entry = rb_entry(n, struct extent_map, rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400123 prev = n;
124 prev_entry = entry;
125
Chris Masond1310b22008-01-24 16:13:08 -0500126 WARN_ON(!entry->in_tree);
127
Chris Masona52d9a82007-08-27 16:49:44 -0400128 if (offset < entry->start)
129 n = n->rb_left;
Chris Masond1310b22008-01-24 16:13:08 -0500130 else if (offset >= extent_map_end(entry))
Chris Masona52d9a82007-08-27 16:49:44 -0400131 n = n->rb_right;
132 else
133 return n;
134 }
Chris Mason5f564062008-01-22 16:47:59 -0500135
136 if (prev_ret) {
137 orig_prev = prev;
Chris Masond3977122009-01-05 21:25:51 -0500138 while (prev && offset >= extent_map_end(prev_entry)) {
Chris Mason5f564062008-01-22 16:47:59 -0500139 prev = rb_next(prev);
Chris Masond1310b22008-01-24 16:13:08 -0500140 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Mason5f564062008-01-22 16:47:59 -0500141 }
142 *prev_ret = prev;
143 prev = orig_prev;
Chris Masona52d9a82007-08-27 16:49:44 -0400144 }
Chris Mason5f564062008-01-22 16:47:59 -0500145
146 if (next_ret) {
Chris Masond1310b22008-01-24 16:13:08 -0500147 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Masond3977122009-01-05 21:25:51 -0500148 while (prev && offset < prev_entry->start) {
Chris Mason5f564062008-01-22 16:47:59 -0500149 prev = rb_prev(prev);
Chris Masond1310b22008-01-24 16:13:08 -0500150 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Mason5f564062008-01-22 16:47:59 -0500151 }
152 *next_ret = prev;
153 }
Chris Masona52d9a82007-08-27 16:49:44 -0400154 return NULL;
155}
156
Chris Masond352ac62008-09-29 15:18:18 -0400157/* check to see if two extent_map structs are adjacent and safe to merge */
Chris Masond1310b22008-01-24 16:13:08 -0500158static int mergable_maps(struct extent_map *prev, struct extent_map *next)
Chris Masona52d9a82007-08-27 16:49:44 -0400159{
Chris Mason7f3c74f2008-07-18 12:01:11 -0400160 if (test_bit(EXTENT_FLAG_PINNED, &prev->flags))
161 return 0;
162
Chris Masonc8b97812008-10-29 14:49:59 -0400163 /*
164 * don't merge compressed extents, we need to know their
165 * actual size
166 */
167 if (test_bit(EXTENT_FLAG_COMPRESSED, &prev->flags))
168 return 0;
169
Chris Masond1310b22008-01-24 16:13:08 -0500170 if (extent_map_end(prev) == next->start &&
171 prev->flags == next->flags &&
172 prev->bdev == next->bdev &&
173 ((next->block_start == EXTENT_MAP_HOLE &&
174 prev->block_start == EXTENT_MAP_HOLE) ||
175 (next->block_start == EXTENT_MAP_INLINE &&
176 prev->block_start == EXTENT_MAP_INLINE) ||
177 (next->block_start == EXTENT_MAP_DELALLOC &&
178 prev->block_start == EXTENT_MAP_DELALLOC) ||
179 (next->block_start < EXTENT_MAP_LAST_BYTE - 1 &&
180 next->block_start == extent_map_block_end(prev)))) {
181 return 1;
182 }
Chris Masona52d9a82007-08-27 16:49:44 -0400183 return 0;
184}
185
Chris Masona1ed8352009-09-11 12:27:37 -0400186int unpin_extent_cache(struct extent_map_tree *tree, u64 start, u64 len)
187{
188 int ret = 0;
189 struct extent_map *merge = NULL;
190 struct rb_node *rb;
191 struct extent_map *em;
192
193 write_lock(&tree->lock);
194 em = lookup_extent_mapping(tree, start, len);
195
Dan Carpenter4eb39912009-11-10 09:01:43 +0000196 WARN_ON(!em || em->start != start);
Chris Masona1ed8352009-09-11 12:27:37 -0400197
198 if (!em)
199 goto out;
200
201 clear_bit(EXTENT_FLAG_PINNED, &em->flags);
202
203 if (em->start != 0) {
204 rb = rb_prev(&em->rb_node);
205 if (rb)
206 merge = rb_entry(rb, struct extent_map, rb_node);
207 if (rb && mergable_maps(merge, em)) {
208 em->start = merge->start;
209 em->len += merge->len;
210 em->block_len += merge->block_len;
211 em->block_start = merge->block_start;
212 merge->in_tree = 0;
213 rb_erase(&merge->rb_node, &tree->map);
214 free_extent_map(merge);
215 }
216 }
217
218 rb = rb_next(&em->rb_node);
219 if (rb)
220 merge = rb_entry(rb, struct extent_map, rb_node);
221 if (rb && mergable_maps(em, merge)) {
222 em->len += merge->len;
223 em->block_len += merge->len;
224 rb_erase(&merge->rb_node, &tree->map);
225 merge->in_tree = 0;
226 free_extent_map(merge);
227 }
228
229 free_extent_map(em);
230out:
231 write_unlock(&tree->lock);
232 return ret;
233
234}
235
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400236/**
237 * add_extent_mapping - add new extent map to the extent tree
238 * @tree: tree to insert new map in
239 * @em: map to insert
240 *
241 * Insert @em into @tree or perform a simple forward/backward merge with
242 * existing mappings. The extent_map struct passed in will be inserted
243 * into the tree directly, with an additional reference taken, or a
André Goddard Rosaaf901ca2009-11-14 13:09:05 -0200244 * reference dropped if the merge attempt was successfull.
Chris Masona52d9a82007-08-27 16:49:44 -0400245 */
246int add_extent_mapping(struct extent_map_tree *tree,
247 struct extent_map *em)
248{
249 int ret = 0;
Chris Masond1310b22008-01-24 16:13:08 -0500250 struct extent_map *merge = NULL;
Chris Masona52d9a82007-08-27 16:49:44 -0400251 struct rb_node *rb;
Chris Mason7c2fe322008-08-20 08:51:50 -0400252 struct extent_map *exist;
Chris Masona52d9a82007-08-27 16:49:44 -0400253
Chris Mason7c2fe322008-08-20 08:51:50 -0400254 exist = lookup_extent_mapping(tree, em->start, em->len);
255 if (exist) {
256 free_extent_map(exist);
257 ret = -EEXIST;
258 goto out;
259 }
Chris Masond1310b22008-01-24 16:13:08 -0500260 rb = tree_insert(&tree->map, em->start, &em->rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400261 if (rb) {
Chris Masona52d9a82007-08-27 16:49:44 -0400262 ret = -EEXIST;
263 goto out;
264 }
265 atomic_inc(&em->refs);
266 if (em->start != 0) {
267 rb = rb_prev(&em->rb_node);
268 if (rb)
Chris Masond1310b22008-01-24 16:13:08 -0500269 merge = rb_entry(rb, struct extent_map, rb_node);
270 if (rb && mergable_maps(merge, em)) {
271 em->start = merge->start;
272 em->len += merge->len;
Chris Masonc8b97812008-10-29 14:49:59 -0400273 em->block_len += merge->block_len;
Chris Masond1310b22008-01-24 16:13:08 -0500274 em->block_start = merge->block_start;
275 merge->in_tree = 0;
276 rb_erase(&merge->rb_node, &tree->map);
277 free_extent_map(merge);
Chris Masona52d9a82007-08-27 16:49:44 -0400278 }
279 }
Chris Masond1310b22008-01-24 16:13:08 -0500280 rb = rb_next(&em->rb_node);
281 if (rb)
282 merge = rb_entry(rb, struct extent_map, rb_node);
283 if (rb && mergable_maps(em, merge)) {
284 em->len += merge->len;
Chris Masonc8b97812008-10-29 14:49:59 -0400285 em->block_len += merge->len;
Chris Masond1310b22008-01-24 16:13:08 -0500286 rb_erase(&merge->rb_node, &tree->map);
287 merge->in_tree = 0;
288 free_extent_map(merge);
289 }
Chris Masona52d9a82007-08-27 16:49:44 -0400290out:
Chris Masona52d9a82007-08-27 16:49:44 -0400291 return ret;
292}
Chris Masona52d9a82007-08-27 16:49:44 -0400293
/*
 * Compute start + len for an extent, saturating at the largest u64 value
 * instead of wrapping around when the sum overflows.
 */
static u64 range_end(u64 start, u64 len)
{
	u64 end = start + len;

	return end < start ? (u64)-1 : end;
}
301
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400302/**
303 * lookup_extent_mapping - lookup extent_map
304 * @tree: tree to lookup in
305 * @start: byte offset to start the search
306 * @len: length of the lookup range
307 *
308 * Find and return the first extent_map struct in @tree that intersects the
309 * [start, len] range. There may be additional objects in the tree that
310 * intersect, so check the object returned carefully to make sure that no
311 * additional lookups are needed.
Chris Masona52d9a82007-08-27 16:49:44 -0400312 */
313struct extent_map *lookup_extent_mapping(struct extent_map_tree *tree,
Chris Masond1310b22008-01-24 16:13:08 -0500314 u64 start, u64 len)
Chris Masona52d9a82007-08-27 16:49:44 -0400315{
316 struct extent_map *em;
317 struct rb_node *rb_node;
Christoph Hellwig306929f2008-06-10 10:21:04 -0400318 struct rb_node *prev = NULL;
319 struct rb_node *next = NULL;
320 u64 end = range_end(start, len);
321
Chris Mason5f564062008-01-22 16:47:59 -0500322 rb_node = __tree_search(&tree->map, start, &prev, &next);
323 if (!rb_node && prev) {
324 em = rb_entry(prev, struct extent_map, rb_node);
Chris Masond1310b22008-01-24 16:13:08 -0500325 if (end > em->start && start < extent_map_end(em))
Chris Mason5f564062008-01-22 16:47:59 -0500326 goto found;
327 }
328 if (!rb_node && next) {
329 em = rb_entry(next, struct extent_map, rb_node);
Chris Masond1310b22008-01-24 16:13:08 -0500330 if (end > em->start && start < extent_map_end(em))
Chris Mason5f564062008-01-22 16:47:59 -0500331 goto found;
332 }
Chris Masona52d9a82007-08-27 16:49:44 -0400333 if (!rb_node) {
334 em = NULL;
335 goto out;
336 }
337 if (IS_ERR(rb_node)) {
338 em = ERR_PTR(PTR_ERR(rb_node));
339 goto out;
340 }
341 em = rb_entry(rb_node, struct extent_map, rb_node);
Chris Masond1310b22008-01-24 16:13:08 -0500342 if (end > em->start && start < extent_map_end(em))
343 goto found;
344
345 em = NULL;
346 goto out;
347
Chris Mason5f564062008-01-22 16:47:59 -0500348found:
Chris Masona52d9a82007-08-27 16:49:44 -0400349 atomic_inc(&em->refs);
350out:
Chris Masona52d9a82007-08-27 16:49:44 -0400351 return em;
352}
Chris Masona52d9a82007-08-27 16:49:44 -0400353
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400354/**
Chris Masonb917b7c2009-09-18 16:07:03 -0400355 * search_extent_mapping - find a nearby extent map
356 * @tree: tree to lookup in
357 * @start: byte offset to start the search
358 * @len: length of the lookup range
359 *
360 * Find and return the first extent_map struct in @tree that intersects the
361 * [start, len] range.
362 *
363 * If one can't be found, any nearby extent may be returned
364 */
365struct extent_map *search_extent_mapping(struct extent_map_tree *tree,
366 u64 start, u64 len)
367{
368 struct extent_map *em;
369 struct rb_node *rb_node;
370 struct rb_node *prev = NULL;
371 struct rb_node *next = NULL;
372
373 rb_node = __tree_search(&tree->map, start, &prev, &next);
374 if (!rb_node && prev) {
375 em = rb_entry(prev, struct extent_map, rb_node);
376 goto found;
377 }
378 if (!rb_node && next) {
379 em = rb_entry(next, struct extent_map, rb_node);
380 goto found;
381 }
382 if (!rb_node) {
383 em = NULL;
384 goto out;
385 }
386 if (IS_ERR(rb_node)) {
387 em = ERR_PTR(PTR_ERR(rb_node));
388 goto out;
389 }
390 em = rb_entry(rb_node, struct extent_map, rb_node);
391 goto found;
392
393 em = NULL;
394 goto out;
395
396found:
397 atomic_inc(&em->refs);
398out:
399 return em;
400}
401
402/**
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400403 * remove_extent_mapping - removes an extent_map from the extent tree
404 * @tree: extent tree to remove from
405 * @em: extent map beeing removed
406 *
407 * Removes @em from @tree. No reference counts are dropped, and no checks
408 * are done to see if the range is in use
Chris Masona52d9a82007-08-27 16:49:44 -0400409 */
410int remove_extent_mapping(struct extent_map_tree *tree, struct extent_map *em)
411{
Chris Masond1310b22008-01-24 16:13:08 -0500412 int ret = 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400413
Chris Mason7f3c74f2008-07-18 12:01:11 -0400414 WARN_ON(test_bit(EXTENT_FLAG_PINNED, &em->flags));
Chris Masond1310b22008-01-24 16:13:08 -0500415 rb_erase(&em->rb_node, &tree->map);
416 em->in_tree = 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400417 return ret;
418}