// SPDX-License-Identifier: GPL-2.0

#include <linux/err.h>
#include <linux/slab.h>
#include <linux/spinlock.h>
#include "ctree.h"
#include "extent_map.h"
#include "compression.h"


Chris Masona52d9a82007-08-27 16:49:44 -040011static struct kmem_cache *extent_map_cache;
Chris Masonca664622007-11-27 11:16:35 -050012
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050013int __init extent_map_init(void)
Chris Masona52d9a82007-08-27 16:49:44 -040014{
David Sterba837e1972012-09-07 03:00:48 -060015 extent_map_cache = kmem_cache_create("btrfs_extent_map",
Christoph Hellwig9601e3f2009-04-13 15:33:09 +020016 sizeof(struct extent_map), 0,
Nikolay Borisovfba4b692016-06-23 21:17:08 +030017 SLAB_MEM_SPREAD, NULL);
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050018 if (!extent_map_cache)
19 return -ENOMEM;
Wyatt Banks2f4cbe62007-11-19 10:22:33 -050020 return 0;
Chris Masona52d9a82007-08-27 16:49:44 -040021}
22
David Sterbae67c7182018-02-19 17:24:18 +010023void __cold extent_map_exit(void)
Chris Masona52d9a82007-08-27 16:49:44 -040024{
Kinglong Mee5598e902016-01-29 21:36:35 +080025 kmem_cache_destroy(extent_map_cache);
Chris Masona52d9a82007-08-27 16:49:44 -040026}
27
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040028/**
29 * extent_map_tree_init - initialize extent map tree
30 * @tree: tree to initialize
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040031 *
32 * Initialize the extent tree @tree. Should be called for each new inode
33 * or other user of the extent_map interface.
34 */
David Sterbaa8067e02011-04-21 00:34:43 +020035void extent_map_tree_init(struct extent_map_tree *tree)
Chris Masona52d9a82007-08-27 16:49:44 -040036{
Eric Paris6bef4d32010-02-23 19:43:04 +000037 tree->map = RB_ROOT;
Josef Bacik5dc562c2012-08-17 13:14:17 -040038 INIT_LIST_HEAD(&tree->modified_extents);
Chris Mason890871b2009-09-02 16:24:52 -040039 rwlock_init(&tree->lock);
Chris Masona52d9a82007-08-27 16:49:44 -040040}
Chris Masona52d9a82007-08-27 16:49:44 -040041
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040042/**
43 * alloc_extent_map - allocate new extent map structure
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040044 *
45 * Allocate a new extent_map structure. The new structure is
46 * returned with a reference count of one and needs to be
47 * freed using free_extent_map()
48 */
David Sterba172ddd62011-04-21 00:48:27 +020049struct extent_map *alloc_extent_map(void)
Chris Masona52d9a82007-08-27 16:49:44 -040050{
51 struct extent_map *em;
Josef Bacik70c8a912012-10-11 16:54:30 -040052 em = kmem_cache_zalloc(extent_map_cache, GFP_NOFS);
Tsutomu Itohc26a9202011-02-14 00:45:29 +000053 if (!em)
54 return NULL;
Filipe Mananacbc0e922014-02-25 14:15:12 +000055 RB_CLEAR_NODE(&em->rb_node);
Chris Masond1310b22008-01-24 16:13:08 -050056 em->flags = 0;
Li Zefan261507a02010-12-17 14:21:50 +080057 em->compress_type = BTRFS_COMPRESS_NONE;
Josef Bacik5dc562c2012-08-17 13:14:17 -040058 em->generation = 0;
Elena Reshetova490b54d2017-03-03 10:55:12 +020059 refcount_set(&em->refs, 1);
Josef Bacik5dc562c2012-08-17 13:14:17 -040060 INIT_LIST_HEAD(&em->list);
Chris Masona52d9a82007-08-27 16:49:44 -040061 return em;
62}
Chris Masona52d9a82007-08-27 16:49:44 -040063
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040064/**
65 * free_extent_map - drop reference count of an extent_map
Nicholas D Steeves01327612016-05-19 21:18:45 -040066 * @em: extent map being released
Christoph Hellwig9d2423c2008-06-11 21:52:17 -040067 *
68 * Drops the reference out on @em by one and free the structure
69 * if the reference count hits zero.
70 */
Chris Masona52d9a82007-08-27 16:49:44 -040071void free_extent_map(struct extent_map *em)
72{
Chris Mason2bf5a722007-08-30 11:54:02 -040073 if (!em)
74 return;
Elena Reshetova490b54d2017-03-03 10:55:12 +020075 WARN_ON(refcount_read(&em->refs) == 0);
76 if (refcount_dec_and_test(&em->refs)) {
Filipe Mananacbc0e922014-02-25 14:15:12 +000077 WARN_ON(extent_map_in_tree(em));
Josef Bacik5dc562c2012-08-17 13:14:17 -040078 WARN_ON(!list_empty(&em->list));
Wang Shilong298a8f92014-06-19 10:42:52 +080079 if (test_bit(EXTENT_FLAG_FS_MAPPING, &em->flags))
Jeff Mahoney95617d62015-06-03 10:55:48 -040080 kfree(em->map_lookup);
Chris Masona52d9a82007-08-27 16:49:44 -040081 kmem_cache_free(extent_map_cache, em);
82 }
83}
Chris Masona52d9a82007-08-27 16:49:44 -040084
Filipe David Borba Manana32193c12013-11-25 03:23:51 +000085/* simple helper to do math around the end of an extent, handling wrap */
86static u64 range_end(u64 start, u64 len)
87{
88 if (start + len < start)
89 return (u64)-1;
90 return start + len;
91}
92
93static int tree_insert(struct rb_root *root, struct extent_map *em)
Chris Masona52d9a82007-08-27 16:49:44 -040094{
Chris Masond3977122009-01-05 21:25:51 -050095 struct rb_node **p = &root->rb_node;
96 struct rb_node *parent = NULL;
Filipe David Borba Manana32193c12013-11-25 03:23:51 +000097 struct extent_map *entry = NULL;
98 struct rb_node *orig_parent = NULL;
99 u64 end = range_end(em->start, em->len);
Chris Masona52d9a82007-08-27 16:49:44 -0400100
Chris Masond3977122009-01-05 21:25:51 -0500101 while (*p) {
Chris Masona52d9a82007-08-27 16:49:44 -0400102 parent = *p;
Chris Masond1310b22008-01-24 16:13:08 -0500103 entry = rb_entry(parent, struct extent_map, rb_node);
104
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000105 if (em->start < entry->start)
Chris Masona52d9a82007-08-27 16:49:44 -0400106 p = &(*p)->rb_left;
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000107 else if (em->start >= extent_map_end(entry))
Chris Masona52d9a82007-08-27 16:49:44 -0400108 p = &(*p)->rb_right;
109 else
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000110 return -EEXIST;
Chris Masona52d9a82007-08-27 16:49:44 -0400111 }
112
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000113 orig_parent = parent;
114 while (parent && em->start >= extent_map_end(entry)) {
115 parent = rb_next(parent);
116 entry = rb_entry(parent, struct extent_map, rb_node);
117 }
118 if (parent)
119 if (end > entry->start && em->start < extent_map_end(entry))
120 return -EEXIST;
121
122 parent = orig_parent;
123 entry = rb_entry(parent, struct extent_map, rb_node);
124 while (parent && em->start < entry->start) {
125 parent = rb_prev(parent);
126 entry = rb_entry(parent, struct extent_map, rb_node);
127 }
128 if (parent)
129 if (end > entry->start && em->start < extent_map_end(entry))
130 return -EEXIST;
131
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000132 rb_link_node(&em->rb_node, orig_parent, p);
133 rb_insert_color(&em->rb_node, root);
134 return 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400135}
136
Chris Masond352ac62008-09-29 15:18:18 -0400137/*
138 * search through the tree for an extent_map with a given offset. If
139 * it can't be found, try to find some neighboring extents
140 */
Chris Masona52d9a82007-08-27 16:49:44 -0400141static struct rb_node *__tree_search(struct rb_root *root, u64 offset,
Chris Mason5f564062008-01-22 16:47:59 -0500142 struct rb_node **prev_ret,
143 struct rb_node **next_ret)
Chris Masona52d9a82007-08-27 16:49:44 -0400144{
Chris Masond3977122009-01-05 21:25:51 -0500145 struct rb_node *n = root->rb_node;
Chris Masona52d9a82007-08-27 16:49:44 -0400146 struct rb_node *prev = NULL;
Chris Mason5f564062008-01-22 16:47:59 -0500147 struct rb_node *orig_prev = NULL;
Chris Masond1310b22008-01-24 16:13:08 -0500148 struct extent_map *entry;
149 struct extent_map *prev_entry = NULL;
Chris Masona52d9a82007-08-27 16:49:44 -0400150
Chris Masond3977122009-01-05 21:25:51 -0500151 while (n) {
Chris Masond1310b22008-01-24 16:13:08 -0500152 entry = rb_entry(n, struct extent_map, rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400153 prev = n;
154 prev_entry = entry;
155
156 if (offset < entry->start)
157 n = n->rb_left;
Chris Masond1310b22008-01-24 16:13:08 -0500158 else if (offset >= extent_map_end(entry))
Chris Masona52d9a82007-08-27 16:49:44 -0400159 n = n->rb_right;
160 else
161 return n;
162 }
Chris Mason5f564062008-01-22 16:47:59 -0500163
164 if (prev_ret) {
165 orig_prev = prev;
Chris Masond3977122009-01-05 21:25:51 -0500166 while (prev && offset >= extent_map_end(prev_entry)) {
Chris Mason5f564062008-01-22 16:47:59 -0500167 prev = rb_next(prev);
Chris Masond1310b22008-01-24 16:13:08 -0500168 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Mason5f564062008-01-22 16:47:59 -0500169 }
170 *prev_ret = prev;
171 prev = orig_prev;
Chris Masona52d9a82007-08-27 16:49:44 -0400172 }
Chris Mason5f564062008-01-22 16:47:59 -0500173
174 if (next_ret) {
Chris Masond1310b22008-01-24 16:13:08 -0500175 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Masond3977122009-01-05 21:25:51 -0500176 while (prev && offset < prev_entry->start) {
Chris Mason5f564062008-01-22 16:47:59 -0500177 prev = rb_prev(prev);
Chris Masond1310b22008-01-24 16:13:08 -0500178 prev_entry = rb_entry(prev, struct extent_map, rb_node);
Chris Mason5f564062008-01-22 16:47:59 -0500179 }
180 *next_ret = prev;
181 }
Chris Masona52d9a82007-08-27 16:49:44 -0400182 return NULL;
183}
184
Chris Masond352ac62008-09-29 15:18:18 -0400185/* check to see if two extent_map structs are adjacent and safe to merge */
Chris Masond1310b22008-01-24 16:13:08 -0500186static int mergable_maps(struct extent_map *prev, struct extent_map *next)
Chris Masona52d9a82007-08-27 16:49:44 -0400187{
Chris Mason7f3c74f2008-07-18 12:01:11 -0400188 if (test_bit(EXTENT_FLAG_PINNED, &prev->flags))
189 return 0;
190
Chris Masonc8b97812008-10-29 14:49:59 -0400191 /*
192 * don't merge compressed extents, we need to know their
193 * actual size
194 */
195 if (test_bit(EXTENT_FLAG_COMPRESSED, &prev->flags))
196 return 0;
197
Josef Bacik201a9032013-01-24 12:02:07 -0500198 if (test_bit(EXTENT_FLAG_LOGGING, &prev->flags) ||
199 test_bit(EXTENT_FLAG_LOGGING, &next->flags))
200 return 0;
201
Josef Bacik09a2a8f92013-04-05 16:51:15 -0400202 /*
203 * We don't want to merge stuff that hasn't been written to the log yet
204 * since it may not reflect exactly what is on disk, and that would be
205 * bad.
206 */
207 if (!list_empty(&prev->list) || !list_empty(&next->list))
208 return 0;
209
Chris Masond1310b22008-01-24 16:13:08 -0500210 if (extent_map_end(prev) == next->start &&
211 prev->flags == next->flags &&
212 prev->bdev == next->bdev &&
213 ((next->block_start == EXTENT_MAP_HOLE &&
214 prev->block_start == EXTENT_MAP_HOLE) ||
215 (next->block_start == EXTENT_MAP_INLINE &&
216 prev->block_start == EXTENT_MAP_INLINE) ||
217 (next->block_start == EXTENT_MAP_DELALLOC &&
218 prev->block_start == EXTENT_MAP_DELALLOC) ||
219 (next->block_start < EXTENT_MAP_LAST_BYTE - 1 &&
220 next->block_start == extent_map_block_end(prev)))) {
221 return 1;
222 }
Chris Masona52d9a82007-08-27 16:49:44 -0400223 return 0;
224}
225
Li Zefan4d2c8f622011-07-14 03:18:33 +0000226static void try_merge_map(struct extent_map_tree *tree, struct extent_map *em)
Chris Masona1ed8352009-09-11 12:27:37 -0400227{
Chris Masona1ed8352009-09-11 12:27:37 -0400228 struct extent_map *merge = NULL;
229 struct rb_node *rb;
Chris Masona1ed8352009-09-11 12:27:37 -0400230
Filipe Manana4a4257c2020-01-31 14:06:07 +0000231 /*
232 * We can't modify an extent map that is in the tree and that is being
233 * used by another task, as it can cause that other task to see it in
234 * inconsistent state during the merging. We always have 1 reference for
235 * the tree and 1 for this task (which is unpinning the extent map or
236 * clearing the logging flag), so anything > 2 means it's being used by
237 * other tasks too.
238 */
239 if (refcount_read(&em->refs) > 2)
240 return;
241
Chris Masona1ed8352009-09-11 12:27:37 -0400242 if (em->start != 0) {
243 rb = rb_prev(&em->rb_node);
244 if (rb)
245 merge = rb_entry(rb, struct extent_map, rb_node);
246 if (rb && mergable_maps(merge, em)) {
247 em->start = merge->start;
Josef Bacik70c8a912012-10-11 16:54:30 -0400248 em->orig_start = merge->orig_start;
Chris Masona1ed8352009-09-11 12:27:37 -0400249 em->len += merge->len;
250 em->block_len += merge->block_len;
251 em->block_start = merge->block_start;
Josef Bacik70c8a912012-10-11 16:54:30 -0400252 em->mod_len = (em->mod_len + em->mod_start) - merge->mod_start;
253 em->mod_start = merge->mod_start;
254 em->generation = max(em->generation, merge->generation);
Josef Bacik5dc562c2012-08-17 13:14:17 -0400255
Chris Masona1ed8352009-09-11 12:27:37 -0400256 rb_erase(&merge->rb_node, &tree->map);
Filipe Mananacbc0e922014-02-25 14:15:12 +0000257 RB_CLEAR_NODE(&merge->rb_node);
Chris Masona1ed8352009-09-11 12:27:37 -0400258 free_extent_map(merge);
259 }
260 }
261
262 rb = rb_next(&em->rb_node);
263 if (rb)
264 merge = rb_entry(rb, struct extent_map, rb_node);
265 if (rb && mergable_maps(em, merge)) {
266 em->len += merge->len;
Filipe David Borba Mananad527afe2013-11-30 11:28:35 +0000267 em->block_len += merge->block_len;
Chris Masona1ed8352009-09-11 12:27:37 -0400268 rb_erase(&merge->rb_node, &tree->map);
Filipe Mananacbc0e922014-02-25 14:15:12 +0000269 RB_CLEAR_NODE(&merge->rb_node);
Josef Bacik70c8a912012-10-11 16:54:30 -0400270 em->mod_len = (merge->mod_start + merge->mod_len) - em->mod_start;
271 em->generation = max(em->generation, merge->generation);
Chris Masona1ed8352009-09-11 12:27:37 -0400272 free_extent_map(merge);
273 }
Li Zefan4d2c8f622011-07-14 03:18:33 +0000274}
275
Josef Bacik5dc562c2012-08-17 13:14:17 -0400276/**
Liu Bo52b1de92012-10-30 17:13:52 +0800277 * unpin_extent_cache - unpin an extent from the cache
Josef Bacik5dc562c2012-08-17 13:14:17 -0400278 * @tree: tree to unpin the extent in
279 * @start: logical offset in the file
280 * @len: length of the extent
281 * @gen: generation that this extent has been modified in
Josef Bacik5dc562c2012-08-17 13:14:17 -0400282 *
283 * Called after an extent has been written to disk properly. Set the generation
284 * to the generation that actually added the file item to the inode so we know
285 * we need to sync this extent when we call fsync().
286 */
287int unpin_extent_cache(struct extent_map_tree *tree, u64 start, u64 len,
288 u64 gen)
Li Zefan4d2c8f622011-07-14 03:18:33 +0000289{
290 int ret = 0;
291 struct extent_map *em;
Liu Bo4e2f84e2012-08-27 10:52:20 -0600292 bool prealloc = false;
Li Zefan4d2c8f622011-07-14 03:18:33 +0000293
294 write_lock(&tree->lock);
295 em = lookup_extent_mapping(tree, start, len);
296
297 WARN_ON(!em || em->start != start);
298
299 if (!em)
300 goto out;
301
Josef Bacik5dc562c2012-08-17 13:14:17 -0400302 em->generation = gen;
Li Zefan4d2c8f622011-07-14 03:18:33 +0000303 clear_bit(EXTENT_FLAG_PINNED, &em->flags);
Liu Bo4e2f84e2012-08-27 10:52:20 -0600304 em->mod_start = em->start;
305 em->mod_len = em->len;
306
Josef Bacikb11e2342012-12-03 10:58:15 -0500307 if (test_bit(EXTENT_FLAG_FILLING, &em->flags)) {
Liu Bo4e2f84e2012-08-27 10:52:20 -0600308 prealloc = true;
Josef Bacikb11e2342012-12-03 10:58:15 -0500309 clear_bit(EXTENT_FLAG_FILLING, &em->flags);
Liu Bo4e2f84e2012-08-27 10:52:20 -0600310 }
Li Zefan4d2c8f622011-07-14 03:18:33 +0000311
312 try_merge_map(tree, em);
Liu Bo4e2f84e2012-08-27 10:52:20 -0600313
314 if (prealloc) {
315 em->mod_start = em->start;
316 em->mod_len = em->len;
317 }
318
Chris Masona1ed8352009-09-11 12:27:37 -0400319 free_extent_map(em);
320out:
321 write_unlock(&tree->lock);
322 return ret;
323
324}
325
Josef Bacik201a9032013-01-24 12:02:07 -0500326void clear_em_logging(struct extent_map_tree *tree, struct extent_map *em)
327{
328 clear_bit(EXTENT_FLAG_LOGGING, &em->flags);
Filipe Mananacbc0e922014-02-25 14:15:12 +0000329 if (extent_map_in_tree(em))
Josef Bacik222c81d2013-01-28 09:45:20 -0500330 try_merge_map(tree, em);
Josef Bacik201a9032013-01-24 12:02:07 -0500331}
332
Filipe Manana176840b2014-02-25 14:15:13 +0000333static inline void setup_extent_mapping(struct extent_map_tree *tree,
334 struct extent_map *em,
335 int modified)
336{
Elena Reshetova490b54d2017-03-03 10:55:12 +0200337 refcount_inc(&em->refs);
Filipe Manana176840b2014-02-25 14:15:13 +0000338 em->mod_start = em->start;
339 em->mod_len = em->len;
340
341 if (modified)
342 list_move(&em->list, &tree->modified_extents);
343 else
344 try_merge_map(tree, em);
345}
346
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400347/**
348 * add_extent_mapping - add new extent map to the extent tree
349 * @tree: tree to insert new map in
350 * @em: map to insert
351 *
352 * Insert @em into @tree or perform a simple forward/backward merge with
353 * existing mappings. The extent_map struct passed in will be inserted
354 * into the tree directly, with an additional reference taken, or a
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300355 * reference dropped if the merge attempt was successful.
Chris Masona52d9a82007-08-27 16:49:44 -0400356 */
357int add_extent_mapping(struct extent_map_tree *tree,
Josef Bacik09a2a8f92013-04-05 16:51:15 -0400358 struct extent_map *em, int modified)
Chris Masona52d9a82007-08-27 16:49:44 -0400359{
360 int ret = 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400361
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000362 ret = tree_insert(&tree->map, em);
363 if (ret)
Chris Mason7c2fe322008-08-20 08:51:50 -0400364 goto out;
Filipe David Borba Manana32193c12013-11-25 03:23:51 +0000365
Filipe Manana176840b2014-02-25 14:15:13 +0000366 setup_extent_mapping(tree, em, modified);
Chris Masona52d9a82007-08-27 16:49:44 -0400367out:
Chris Masona52d9a82007-08-27 16:49:44 -0400368 return ret;
369}
Chris Masona52d9a82007-08-27 16:49:44 -0400370
Eric Sandeen48a3b632013-04-25 20:41:01 +0000371static struct extent_map *
372__lookup_extent_mapping(struct extent_map_tree *tree,
373 u64 start, u64 len, int strict)
Li Zefaned64f062011-07-14 03:18:15 +0000374{
375 struct extent_map *em;
376 struct rb_node *rb_node;
377 struct rb_node *prev = NULL;
378 struct rb_node *next = NULL;
379 u64 end = range_end(start, len);
380
381 rb_node = __tree_search(&tree->map, start, &prev, &next);
382 if (!rb_node) {
383 if (prev)
384 rb_node = prev;
385 else if (next)
386 rb_node = next;
387 else
388 return NULL;
389 }
390
391 em = rb_entry(rb_node, struct extent_map, rb_node);
392
393 if (strict && !(end > em->start && start < extent_map_end(em)))
394 return NULL;
395
Elena Reshetova490b54d2017-03-03 10:55:12 +0200396 refcount_inc(&em->refs);
Li Zefaned64f062011-07-14 03:18:15 +0000397 return em;
398}
399
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400400/**
401 * lookup_extent_mapping - lookup extent_map
402 * @tree: tree to lookup in
403 * @start: byte offset to start the search
404 * @len: length of the lookup range
405 *
406 * Find and return the first extent_map struct in @tree that intersects the
407 * [start, len] range. There may be additional objects in the tree that
408 * intersect, so check the object returned carefully to make sure that no
409 * additional lookups are needed.
Chris Masona52d9a82007-08-27 16:49:44 -0400410 */
411struct extent_map *lookup_extent_mapping(struct extent_map_tree *tree,
Chris Masond1310b22008-01-24 16:13:08 -0500412 u64 start, u64 len)
Chris Masona52d9a82007-08-27 16:49:44 -0400413{
Li Zefaned64f062011-07-14 03:18:15 +0000414 return __lookup_extent_mapping(tree, start, len, 1);
Chris Masona52d9a82007-08-27 16:49:44 -0400415}
Chris Masona52d9a82007-08-27 16:49:44 -0400416
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400417/**
Chris Masonb917b7c2009-09-18 16:07:03 -0400418 * search_extent_mapping - find a nearby extent map
419 * @tree: tree to lookup in
420 * @start: byte offset to start the search
421 * @len: length of the lookup range
422 *
423 * Find and return the first extent_map struct in @tree that intersects the
424 * [start, len] range.
425 *
426 * If one can't be found, any nearby extent may be returned
427 */
428struct extent_map *search_extent_mapping(struct extent_map_tree *tree,
429 u64 start, u64 len)
430{
Li Zefaned64f062011-07-14 03:18:15 +0000431 return __lookup_extent_mapping(tree, start, len, 0);
Chris Masonb917b7c2009-09-18 16:07:03 -0400432}
433
434/**
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400435 * remove_extent_mapping - removes an extent_map from the extent tree
436 * @tree: extent tree to remove from
Adam Buchbinderbb7ab3b2016-03-04 11:23:12 -0800437 * @em: extent map being removed
Christoph Hellwig9d2423c2008-06-11 21:52:17 -0400438 *
439 * Removes @em from @tree. No reference counts are dropped, and no checks
440 * are done to see if the range is in use
Chris Masona52d9a82007-08-27 16:49:44 -0400441 */
442int remove_extent_mapping(struct extent_map_tree *tree, struct extent_map *em)
443{
Chris Masond1310b22008-01-24 16:13:08 -0500444 int ret = 0;
Chris Masona52d9a82007-08-27 16:49:44 -0400445
Chris Mason7f3c74f2008-07-18 12:01:11 -0400446 WARN_ON(test_bit(EXTENT_FLAG_PINNED, &em->flags));
Chris Masond1310b22008-01-24 16:13:08 -0500447 rb_erase(&em->rb_node, &tree->map);
Josef Bacikff44c6e2012-09-14 12:59:20 -0400448 if (!test_bit(EXTENT_FLAG_LOGGING, &em->flags))
449 list_del_init(&em->list);
Filipe Mananacbc0e922014-02-25 14:15:12 +0000450 RB_CLEAR_NODE(&em->rb_node);
Chris Masona52d9a82007-08-27 16:49:44 -0400451 return ret;
452}
Filipe Manana176840b2014-02-25 14:15:13 +0000453
454void replace_extent_mapping(struct extent_map_tree *tree,
455 struct extent_map *cur,
456 struct extent_map *new,
457 int modified)
458{
459 WARN_ON(test_bit(EXTENT_FLAG_PINNED, &cur->flags));
460 ASSERT(extent_map_in_tree(cur));
461 if (!test_bit(EXTENT_FLAG_LOGGING, &cur->flags))
462 list_del_init(&cur->list);
463 rb_replace_node(&cur->rb_node, &new->rb_node, &tree->map);
464 RB_CLEAR_NODE(&cur->rb_node);
465
466 setup_extent_mapping(tree, new, modified);
467}
Liu Boc04e61b2018-01-05 12:51:11 -0700468
469static struct extent_map *next_extent_map(struct extent_map *em)
470{
471 struct rb_node *next;
472
473 next = rb_next(&em->rb_node);
474 if (!next)
475 return NULL;
476 return container_of(next, struct extent_map, rb_node);
477}
478
479static struct extent_map *prev_extent_map(struct extent_map *em)
480{
481 struct rb_node *prev;
482
483 prev = rb_prev(&em->rb_node);
484 if (!prev)
485 return NULL;
486 return container_of(prev, struct extent_map, rb_node);
487}
488
489/* helper for btfs_get_extent. Given an existing extent in the tree,
490 * the existing extent is the nearest extent to map_start,
491 * and an extent that you want to insert, deal with overlap and insert
492 * the best fitted new extent into the tree.
493 */
Liu Bo5f4791f2018-01-05 12:51:17 -0700494static noinline int merge_extent_mapping(struct extent_map_tree *em_tree,
495 struct extent_map *existing,
496 struct extent_map *em,
497 u64 map_start)
Liu Boc04e61b2018-01-05 12:51:11 -0700498{
499 struct extent_map *prev;
500 struct extent_map *next;
501 u64 start;
502 u64 end;
503 u64 start_diff;
504
505 BUG_ON(map_start < em->start || map_start >= extent_map_end(em));
506
507 if (existing->start > map_start) {
508 next = existing;
509 prev = prev_extent_map(next);
510 } else {
511 prev = existing;
512 next = next_extent_map(prev);
513 }
514
515 start = prev ? extent_map_end(prev) : em->start;
516 start = max_t(u64, start, em->start);
517 end = next ? next->start : extent_map_end(em);
518 end = min_t(u64, end, extent_map_end(em));
519 start_diff = start - em->start;
520 em->start = start;
521 em->len = end - start;
522 if (em->block_start < EXTENT_MAP_LAST_BYTE &&
523 !test_bit(EXTENT_FLAG_COMPRESSED, &em->flags)) {
524 em->block_start += start_diff;
525 em->block_len = em->len;
526 }
527 return add_extent_mapping(em_tree, em, 0);
528}
529
530/**
531 * btrfs_add_extent_mapping - add extent mapping into em_tree
David Sterbaf46b24c2018-04-03 21:45:57 +0200532 * @fs_info - used for tracepoint
Liu Boc04e61b2018-01-05 12:51:11 -0700533 * @em_tree - the extent tree into which we want to insert the extent mapping
534 * @em_in - extent we are inserting
535 * @start - start of the logical range btrfs_get_extent() is requesting
536 * @len - length of the logical range btrfs_get_extent() is requesting
537 *
538 * Note that @em_in's range may be different from [start, start+len),
539 * but they must be overlapped.
540 *
541 * Insert @em_in into @em_tree. In case there is an overlapping range, handle
542 * the -EEXIST by either:
543 * a) Returning the existing extent in @em_in if @start is within the
544 * existing em.
545 * b) Merge the existing extent with @em_in passed in.
546 *
547 * Return 0 on success, otherwise -EEXIST.
548 *
549 */
David Sterbaf46b24c2018-04-03 21:45:57 +0200550int btrfs_add_extent_mapping(struct btrfs_fs_info *fs_info,
551 struct extent_map_tree *em_tree,
Liu Boc04e61b2018-01-05 12:51:11 -0700552 struct extent_map **em_in, u64 start, u64 len)
553{
554 int ret;
555 struct extent_map *em = *em_in;
556
557 ret = add_extent_mapping(em_tree, em, 0);
558 /* it is possible that someone inserted the extent into the tree
559 * while we had the lock dropped. It is also possible that
560 * an overlapping map exists in the tree
561 */
562 if (ret == -EEXIST) {
563 struct extent_map *existing;
564
565 ret = 0;
566
567 existing = search_extent_mapping(em_tree, start, len);
Liu Bo393da912018-01-05 12:51:16 -0700568
David Sterbaf46b24c2018-04-03 21:45:57 +0200569 trace_btrfs_handle_em_exist(fs_info, existing, em, start, len);
Liu Bo393da912018-01-05 12:51:16 -0700570
Liu Boc04e61b2018-01-05 12:51:11 -0700571 /*
572 * existing will always be non-NULL, since there must be
573 * extent causing the -EEXIST.
574 */
575 if (start >= existing->start &&
576 start < extent_map_end(existing)) {
577 free_extent_map(em);
578 *em_in = existing;
579 ret = 0;
580 } else {
Liu Bo9a7e10e2018-01-05 12:51:15 -0700581 u64 orig_start = em->start;
582 u64 orig_len = em->len;
583
Liu Boc04e61b2018-01-05 12:51:11 -0700584 /*
585 * The existing extent map is the one nearest to
586 * the [start, start + len) range which overlaps
587 */
588 ret = merge_extent_mapping(em_tree, existing,
589 em, start);
Liu Boc04e61b2018-01-05 12:51:11 -0700590 if (ret) {
591 free_extent_map(em);
592 *em_in = NULL;
Liu Bo9a7e10e2018-01-05 12:51:15 -0700593 WARN_ONCE(ret,
594"unexpected error %d: merge existing(start %llu len %llu) with em(start %llu len %llu)\n",
595 ret, existing->start, existing->len,
596 orig_start, orig_len);
Liu Boc04e61b2018-01-05 12:51:11 -0700597 }
Liu Bo9a7e10e2018-01-05 12:51:15 -0700598 free_extent_map(existing);
Liu Boc04e61b2018-01-05 12:51:11 -0700599 }
600 }
601
602 ASSERT(ret == 0 || ret == -EEXIST);
603 return ret;
604}