blob: fd8233e05cf4f6682ad6c9fcc76ef7913fd457ee [file] [log] [blame]
/*
 * Copyright (C) 2007 Oracle.  All rights reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public
 * License v2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public
 * License along with this program; if not, write to the
 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
 * Boston, MA 02111-1307, USA.
 */
18
Chris Masona6b6e752007-10-15 16:22:39 -040019#include <linux/sched.h>
Chris Masoneb60cea2007-02-02 09:18:22 -050020#include "ctree.h"
21#include "disk-io.h"
Chris Mason7f5c1512007-03-23 15:56:19 -040022#include "transaction.h"
Chris Mason5f39d392007-10-15 16:14:19 -040023#include "print-tree.h"
Chris Mason9a8dd152007-02-23 08:38:36 -050024
/*
 * forward declarations of file-local helpers
 */
static int split_node(struct btrfs_trans_handle *trans,
		      struct btrfs_root *root,
		      struct btrfs_path *path, int level);
static int split_leaf(struct btrfs_trans_handle *trans,
		      struct btrfs_root *root,
		      struct btrfs_key *ins_key,
		      struct btrfs_path *path, int data_size, int extend);
static int push_node_left(struct btrfs_trans_handle *trans,
			  struct btrfs_root *root,
			  struct extent_buffer *dst,
			  struct extent_buffer *src);
static int balance_node_right(struct btrfs_trans_handle *trans,
			      struct btrfs_root *root,
			      struct extent_buffer *dst_buf,
			      struct extent_buffer *src_buf);
static int del_ptr(struct btrfs_trans_handle *trans,
		   struct btrfs_root *root,
		   struct btrfs_path *path, int level, int slot);
Chris Masond97e63b2007-02-20 16:40:44 -050039
Chris Masondf24a2b2007-04-04 09:36:31 -040040inline void btrfs_init_path(struct btrfs_path *p)
41{
42 memset(p, 0, sizeof(*p));
43}
44
Chris Mason2c90e5d2007-04-02 10:50:19 -040045struct btrfs_path *btrfs_alloc_path(void)
46{
Chris Masondf24a2b2007-04-04 09:36:31 -040047 struct btrfs_path *path;
48 path = kmem_cache_alloc(btrfs_path_cachep, GFP_NOFS);
Chris Mason2cc58cf2007-08-27 16:49:44 -040049 if (path) {
Chris Masondf24a2b2007-04-04 09:36:31 -040050 btrfs_init_path(path);
Chris Mason2cc58cf2007-08-27 16:49:44 -040051 path->reada = 1;
52 }
Chris Masondf24a2b2007-04-04 09:36:31 -040053 return path;
Chris Mason2c90e5d2007-04-02 10:50:19 -040054}
55
56void btrfs_free_path(struct btrfs_path *p)
57{
Chris Masondf24a2b2007-04-04 09:36:31 -040058 btrfs_release_path(NULL, p);
Chris Mason2c90e5d2007-04-02 10:50:19 -040059 kmem_cache_free(btrfs_path_cachep, p);
60}
61
Chris Mason234b63a2007-03-13 10:46:10 -040062void btrfs_release_path(struct btrfs_root *root, struct btrfs_path *p)
Chris Masoneb60cea2007-02-02 09:18:22 -050063{
64 int i;
Chris Mason234b63a2007-03-13 10:46:10 -040065 for (i = 0; i < BTRFS_MAX_LEVEL; i++) {
Chris Masoneb60cea2007-02-02 09:18:22 -050066 if (!p->nodes[i])
67 break;
Chris Mason5f39d392007-10-15 16:14:19 -040068 free_extent_buffer(p->nodes[i]);
Chris Masoneb60cea2007-02-02 09:18:22 -050069 }
Chris Masonaa5d6be2007-02-28 16:35:06 -050070 memset(p, 0, sizeof(*p));
Chris Masoneb60cea2007-02-02 09:18:22 -050071}
72
Chris Mason5f39d392007-10-15 16:14:19 -040073static int __btrfs_cow_block(struct btrfs_trans_handle *trans,
74 struct btrfs_root *root,
75 struct extent_buffer *buf,
76 struct extent_buffer *parent, int parent_slot,
77 struct extent_buffer **cow_ret,
78 u64 search_start, u64 empty_size)
Chris Mason6702ed42007-08-07 16:15:09 -040079{
Chris Mason7bb86312007-12-11 09:25:06 -050080 u64 root_gen;
Chris Mason5f39d392007-10-15 16:14:19 -040081 struct extent_buffer *cow;
Chris Mason7bb86312007-12-11 09:25:06 -050082 u32 nritems;
Chris Mason6702ed42007-08-07 16:15:09 -040083 int ret = 0;
84 int different_trans = 0;
Chris Mason7bb86312007-12-11 09:25:06 -050085 int level;
86 struct btrfs_key first_key;
Chris Mason6702ed42007-08-07 16:15:09 -040087
Chris Mason7bb86312007-12-11 09:25:06 -050088 if (root->ref_cows) {
89 root_gen = trans->transid;
90 } else {
91 root_gen = 0;
92 }
93
94 WARN_ON(root->ref_cows && trans->transid !=
95 root->fs_info->running_transaction->transid);
Chris Mason6702ed42007-08-07 16:15:09 -040096 WARN_ON(root->ref_cows && trans->transid != root->last_trans);
Chris Mason5f39d392007-10-15 16:14:19 -040097
Chris Mason7bb86312007-12-11 09:25:06 -050098 level = btrfs_header_level(buf);
99 nritems = btrfs_header_nritems(buf);
100 if (nritems) {
101 if (level == 0)
102 btrfs_item_key_to_cpu(buf, &first_key, 0);
103 else
104 btrfs_node_key_to_cpu(buf, &first_key, 0);
105 } else {
106 first_key.objectid = 0;
107 }
108 cow = __btrfs_alloc_free_block(trans, root, buf->len,
109 root->root_key.objectid,
110 root_gen, first_key.objectid, level,
Chris Masondb945352007-10-15 16:15:53 -0400111 search_start, empty_size);
Chris Mason6702ed42007-08-07 16:15:09 -0400112 if (IS_ERR(cow))
113 return PTR_ERR(cow);
114
Chris Mason5f39d392007-10-15 16:14:19 -0400115 copy_extent_buffer(cow, buf, 0, 0, cow->len);
Chris Masondb945352007-10-15 16:15:53 -0400116 btrfs_set_header_bytenr(cow, cow->start);
Chris Mason5f39d392007-10-15 16:14:19 -0400117 btrfs_set_header_generation(cow, trans->transid);
118 btrfs_set_header_owner(cow, root->root_key.objectid);
Chris Mason6702ed42007-08-07 16:15:09 -0400119
Chris Mason5f39d392007-10-15 16:14:19 -0400120 WARN_ON(btrfs_header_generation(buf) > trans->transid);
121 if (btrfs_header_generation(buf) != trans->transid) {
Chris Mason6702ed42007-08-07 16:15:09 -0400122 different_trans = 1;
123 ret = btrfs_inc_ref(trans, root, buf);
124 if (ret)
125 return ret;
126 } else {
Chris Mason6702ed42007-08-07 16:15:09 -0400127 clean_tree_block(trans, root, buf);
128 }
129
130 if (buf == root->node) {
Chris Mason7bb86312007-12-11 09:25:06 -0500131 root_gen = btrfs_header_generation(buf);
Chris Mason6702ed42007-08-07 16:15:09 -0400132 root->node = cow;
Chris Mason5f39d392007-10-15 16:14:19 -0400133 extent_buffer_get(cow);
Chris Mason6702ed42007-08-07 16:15:09 -0400134 if (buf != root->commit_root) {
Chris Masondb945352007-10-15 16:15:53 -0400135 btrfs_free_extent(trans, root, buf->start,
Chris Mason7bb86312007-12-11 09:25:06 -0500136 buf->len, root->root_key.objectid,
137 root_gen, 0, 0, 1);
Chris Mason6702ed42007-08-07 16:15:09 -0400138 }
Chris Mason5f39d392007-10-15 16:14:19 -0400139 free_extent_buffer(buf);
Chris Mason6702ed42007-08-07 16:15:09 -0400140 } else {
Chris Mason7bb86312007-12-11 09:25:06 -0500141 root_gen = btrfs_header_generation(parent);
Chris Mason5f39d392007-10-15 16:14:19 -0400142 btrfs_set_node_blockptr(parent, parent_slot,
Chris Masondb945352007-10-15 16:15:53 -0400143 cow->start);
Chris Mason74493f72007-12-11 09:25:06 -0500144 WARN_ON(trans->transid == 0);
145 btrfs_set_node_ptr_generation(parent, parent_slot,
146 trans->transid);
Chris Mason6702ed42007-08-07 16:15:09 -0400147 btrfs_mark_buffer_dirty(parent);
Chris Mason5f39d392007-10-15 16:14:19 -0400148 WARN_ON(btrfs_header_generation(parent) != trans->transid);
Chris Mason7bb86312007-12-11 09:25:06 -0500149 btrfs_free_extent(trans, root, buf->start, buf->len,
150 btrfs_header_owner(parent), root_gen,
151 0, 0, 1);
Chris Mason6702ed42007-08-07 16:15:09 -0400152 }
Chris Mason5f39d392007-10-15 16:14:19 -0400153 free_extent_buffer(buf);
Chris Mason6702ed42007-08-07 16:15:09 -0400154 btrfs_mark_buffer_dirty(cow);
155 *cow_ret = cow;
156 return 0;
157}
158
Chris Mason5f39d392007-10-15 16:14:19 -0400159int btrfs_cow_block(struct btrfs_trans_handle *trans,
160 struct btrfs_root *root, struct extent_buffer *buf,
161 struct extent_buffer *parent, int parent_slot,
162 struct extent_buffer **cow_ret)
Chris Mason02217ed2007-03-02 16:08:05 -0500163{
Chris Mason6702ed42007-08-07 16:15:09 -0400164 u64 search_start;
Chris Masonf510cfe2007-10-15 16:14:48 -0400165 int ret;
Chris Masonccd467d2007-06-28 15:57:36 -0400166 if (trans->transaction != root->fs_info->running_transaction) {
167 printk(KERN_CRIT "trans %Lu running %Lu\n", trans->transid,
168 root->fs_info->running_transaction->transid);
169 WARN_ON(1);
170 }
171 if (trans->transid != root->fs_info->generation) {
172 printk(KERN_CRIT "trans %Lu running %Lu\n", trans->transid,
173 root->fs_info->generation);
174 WARN_ON(1);
175 }
Chris Mason5f39d392007-10-15 16:14:19 -0400176 if (btrfs_header_generation(buf) == trans->transid) {
Chris Mason02217ed2007-03-02 16:08:05 -0500177 *cow_ret = buf;
178 return 0;
179 }
Chris Mason6702ed42007-08-07 16:15:09 -0400180
Chris Masondb945352007-10-15 16:15:53 -0400181 search_start = buf->start & ~((u64)BTRFS_BLOCK_GROUP_SIZE - 1);
Chris Masonf510cfe2007-10-15 16:14:48 -0400182 ret = __btrfs_cow_block(trans, root, buf, parent,
Chris Mason6702ed42007-08-07 16:15:09 -0400183 parent_slot, cow_ret, search_start, 0);
Chris Masonf510cfe2007-10-15 16:14:48 -0400184 return ret;
Chris Mason6702ed42007-08-07 16:15:09 -0400185}
186
/*
 * returns 1 when the gap between the end of the lower block and the
 * start of the higher one is less than 32768 bytes, 0 otherwise.  Two
 * identical block numbers are never considered close.
 */
static int close_blocks(u64 blocknr, u64 other, u32 blocksize)
{
	u64 gap;

	if (blocknr == other)
		return 0;

	if (blocknr < other)
		gap = other - (blocknr + blocksize);
	else
		gap = blocknr - (other + blocksize);

	return gap < 32768;
}
195
Chris Mason081e9572007-11-06 10:26:24 -0500196/*
197 * compare two keys in a memcmp fashion
198 */
199static int comp_keys(struct btrfs_disk_key *disk, struct btrfs_key *k2)
200{
201 struct btrfs_key k1;
202
203 btrfs_disk_key_to_cpu(&k1, disk);
204
205 if (k1.objectid > k2->objectid)
206 return 1;
207 if (k1.objectid < k2->objectid)
208 return -1;
209 if (k1.type > k2->type)
210 return 1;
211 if (k1.type < k2->type)
212 return -1;
213 if (k1.offset > k2->offset)
214 return 1;
215 if (k1.offset < k2->offset)
216 return -1;
217 return 0;
218}
219
220
Chris Mason6702ed42007-08-07 16:15:09 -0400221int btrfs_realloc_node(struct btrfs_trans_handle *trans,
Chris Mason5f39d392007-10-15 16:14:19 -0400222 struct btrfs_root *root, struct extent_buffer *parent,
Chris Masona6b6e752007-10-15 16:22:39 -0400223 int start_slot, int cache_only, u64 *last_ret,
224 struct btrfs_key *progress)
Chris Mason6702ed42007-08-07 16:15:09 -0400225{
Chris Mason6b800532007-10-15 16:17:34 -0400226 struct extent_buffer *cur;
227 struct extent_buffer *tmp;
Chris Mason6702ed42007-08-07 16:15:09 -0400228 u64 blocknr;
Chris Masone9d0b132007-08-10 14:06:19 -0400229 u64 search_start = *last_ret;
230 u64 last_block = 0;
Chris Mason6702ed42007-08-07 16:15:09 -0400231 u64 other;
232 u32 parent_nritems;
Chris Mason6702ed42007-08-07 16:15:09 -0400233 int end_slot;
234 int i;
235 int err = 0;
Chris Masonf2183bd2007-08-10 14:42:37 -0400236 int parent_level;
Chris Mason6b800532007-10-15 16:17:34 -0400237 int uptodate;
238 u32 blocksize;
Chris Mason081e9572007-11-06 10:26:24 -0500239 int progress_passed = 0;
240 struct btrfs_disk_key disk_key;
Chris Mason6702ed42007-08-07 16:15:09 -0400241
Chris Mason5708b952007-10-25 15:43:18 -0400242 parent_level = btrfs_header_level(parent);
243 if (cache_only && parent_level != 1)
244 return 0;
245
Chris Mason6702ed42007-08-07 16:15:09 -0400246 if (trans->transaction != root->fs_info->running_transaction) {
247 printk(KERN_CRIT "trans %Lu running %Lu\n", trans->transid,
248 root->fs_info->running_transaction->transid);
249 WARN_ON(1);
250 }
251 if (trans->transid != root->fs_info->generation) {
252 printk(KERN_CRIT "trans %Lu running %Lu\n", trans->transid,
253 root->fs_info->generation);
254 WARN_ON(1);
255 }
Chris Mason86479a02007-09-10 19:58:16 -0400256
Chris Mason6b800532007-10-15 16:17:34 -0400257 parent_nritems = btrfs_header_nritems(parent);
Chris Mason6b800532007-10-15 16:17:34 -0400258 blocksize = btrfs_level_size(root, parent_level - 1);
Chris Mason6702ed42007-08-07 16:15:09 -0400259 end_slot = parent_nritems;
260
261 if (parent_nritems == 1)
262 return 0;
263
264 for (i = start_slot; i < end_slot; i++) {
265 int close = 1;
Chris Masona6b6e752007-10-15 16:22:39 -0400266
Chris Mason5708b952007-10-25 15:43:18 -0400267 if (!parent->map_token) {
268 map_extent_buffer(parent,
269 btrfs_node_key_ptr_offset(i),
270 sizeof(struct btrfs_key_ptr),
271 &parent->map_token, &parent->kaddr,
272 &parent->map_start, &parent->map_len,
273 KM_USER1);
274 }
Chris Mason081e9572007-11-06 10:26:24 -0500275 btrfs_node_key(parent, &disk_key, i);
276 if (!progress_passed && comp_keys(&disk_key, progress) < 0)
277 continue;
278
279 progress_passed = 1;
Chris Mason6b800532007-10-15 16:17:34 -0400280 blocknr = btrfs_node_blockptr(parent, i);
Chris Masone9d0b132007-08-10 14:06:19 -0400281 if (last_block == 0)
282 last_block = blocknr;
Chris Mason5708b952007-10-25 15:43:18 -0400283
Chris Mason6702ed42007-08-07 16:15:09 -0400284 if (i > 0) {
Chris Mason6b800532007-10-15 16:17:34 -0400285 other = btrfs_node_blockptr(parent, i - 1);
286 close = close_blocks(blocknr, other, blocksize);
Chris Mason6702ed42007-08-07 16:15:09 -0400287 }
Chris Mason5708b952007-10-25 15:43:18 -0400288 if (close && i < end_slot - 2) {
Chris Mason6b800532007-10-15 16:17:34 -0400289 other = btrfs_node_blockptr(parent, i + 1);
290 close = close_blocks(blocknr, other, blocksize);
Chris Mason6702ed42007-08-07 16:15:09 -0400291 }
Chris Masone9d0b132007-08-10 14:06:19 -0400292 if (close) {
293 last_block = blocknr;
Chris Mason6702ed42007-08-07 16:15:09 -0400294 continue;
Chris Masone9d0b132007-08-10 14:06:19 -0400295 }
Chris Mason5708b952007-10-25 15:43:18 -0400296 if (parent->map_token) {
297 unmap_extent_buffer(parent, parent->map_token,
298 KM_USER1);
299 parent->map_token = NULL;
300 }
Chris Mason6702ed42007-08-07 16:15:09 -0400301
Chris Mason6b800532007-10-15 16:17:34 -0400302 cur = btrfs_find_tree_block(root, blocknr, blocksize);
303 if (cur)
304 uptodate = btrfs_buffer_uptodate(cur);
305 else
306 uptodate = 0;
Chris Mason5708b952007-10-25 15:43:18 -0400307 if (!cur || !uptodate) {
Chris Mason6702ed42007-08-07 16:15:09 -0400308 if (cache_only) {
Chris Mason6b800532007-10-15 16:17:34 -0400309 free_extent_buffer(cur);
Chris Mason6702ed42007-08-07 16:15:09 -0400310 continue;
311 }
Chris Mason6b800532007-10-15 16:17:34 -0400312 if (!cur) {
313 cur = read_tree_block(root, blocknr,
314 blocksize);
315 } else if (!uptodate) {
316 btrfs_read_buffer(cur);
Chris Masonf2183bd2007-08-10 14:42:37 -0400317 }
Chris Mason6702ed42007-08-07 16:15:09 -0400318 }
Chris Masone9d0b132007-08-10 14:06:19 -0400319 if (search_start == 0)
Chris Mason6b800532007-10-15 16:17:34 -0400320 search_start = last_block;
Chris Masone9d0b132007-08-10 14:06:19 -0400321
Chris Mason6b800532007-10-15 16:17:34 -0400322 err = __btrfs_cow_block(trans, root, cur, parent, i,
323 &tmp, search_start,
324 min(16 * blocksize,
325 (end_slot - i) * blocksize));
Yan252c38f2007-08-29 09:11:44 -0400326 if (err) {
Chris Mason6b800532007-10-15 16:17:34 -0400327 free_extent_buffer(cur);
Chris Mason6702ed42007-08-07 16:15:09 -0400328 break;
Yan252c38f2007-08-29 09:11:44 -0400329 }
Chris Mason6b800532007-10-15 16:17:34 -0400330 search_start = tmp->start;
Chris Mason5708b952007-10-25 15:43:18 -0400331 last_block = tmp->start;
Chris Masonf2183bd2007-08-10 14:42:37 -0400332 *last_ret = search_start;
333 if (parent_level == 1)
Chris Mason6b800532007-10-15 16:17:34 -0400334 btrfs_clear_buffer_defrag(tmp);
Chris Mason6b800532007-10-15 16:17:34 -0400335 free_extent_buffer(tmp);
Chris Mason6702ed42007-08-07 16:15:09 -0400336 }
Chris Mason5708b952007-10-25 15:43:18 -0400337 if (parent->map_token) {
338 unmap_extent_buffer(parent, parent->map_token,
339 KM_USER1);
340 parent->map_token = NULL;
341 }
Chris Mason6702ed42007-08-07 16:15:09 -0400342 return err;
343}
344
Chris Mason74123bd2007-02-02 11:05:29 -0500345/*
346 * The leaf data grows from end-to-front in the node.
347 * this returns the address of the start of the last item,
348 * which is the stop of the leaf data stack
349 */
Chris Mason123abc82007-03-14 14:14:43 -0400350static inline unsigned int leaf_data_end(struct btrfs_root *root,
Chris Mason5f39d392007-10-15 16:14:19 -0400351 struct extent_buffer *leaf)
Chris Masonbe0e5c02007-01-26 15:51:26 -0500352{
Chris Mason5f39d392007-10-15 16:14:19 -0400353 u32 nr = btrfs_header_nritems(leaf);
Chris Masonbe0e5c02007-01-26 15:51:26 -0500354 if (nr == 0)
Chris Mason123abc82007-03-14 14:14:43 -0400355 return BTRFS_LEAF_DATA_SIZE(root);
Chris Mason5f39d392007-10-15 16:14:19 -0400356 return btrfs_item_offset_nr(leaf, nr - 1);
Chris Masonbe0e5c02007-01-26 15:51:26 -0500357}
358
Chris Mason123abc82007-03-14 14:14:43 -0400359static int check_node(struct btrfs_root *root, struct btrfs_path *path,
360 int level)
Chris Masonaa5d6be2007-02-28 16:35:06 -0500361{
Chris Mason5f39d392007-10-15 16:14:19 -0400362 struct extent_buffer *parent = NULL;
363 struct extent_buffer *node = path->nodes[level];
364 struct btrfs_disk_key parent_key;
365 struct btrfs_disk_key node_key;
Chris Masonaa5d6be2007-02-28 16:35:06 -0500366 int parent_slot;
Chris Mason8d7be552007-05-10 11:24:42 -0400367 int slot;
368 struct btrfs_key cpukey;
Chris Mason5f39d392007-10-15 16:14:19 -0400369 u32 nritems = btrfs_header_nritems(node);
Chris Masonaa5d6be2007-02-28 16:35:06 -0500370
371 if (path->nodes[level + 1])
Chris Mason5f39d392007-10-15 16:14:19 -0400372 parent = path->nodes[level + 1];
Aneesha1f39632007-07-11 10:03:27 -0400373
Chris Mason8d7be552007-05-10 11:24:42 -0400374 slot = path->slots[level];
Chris Mason7518a232007-03-12 12:01:18 -0400375 BUG_ON(nritems == 0);
376 if (parent) {
Aneesha1f39632007-07-11 10:03:27 -0400377 parent_slot = path->slots[level + 1];
Chris Mason5f39d392007-10-15 16:14:19 -0400378 btrfs_node_key(parent, &parent_key, parent_slot);
379 btrfs_node_key(node, &node_key, 0);
380 BUG_ON(memcmp(&parent_key, &node_key,
Chris Masone2fa7222007-03-12 16:22:34 -0400381 sizeof(struct btrfs_disk_key)));
Chris Mason1d4f8a02007-03-13 09:28:32 -0400382 BUG_ON(btrfs_node_blockptr(parent, parent_slot) !=
Chris Masondb945352007-10-15 16:15:53 -0400383 btrfs_header_bytenr(node));
Chris Masonaa5d6be2007-02-28 16:35:06 -0500384 }
Chris Mason123abc82007-03-14 14:14:43 -0400385 BUG_ON(nritems > BTRFS_NODEPTRS_PER_BLOCK(root));
Chris Mason8d7be552007-05-10 11:24:42 -0400386 if (slot != 0) {
Chris Mason5f39d392007-10-15 16:14:19 -0400387 btrfs_node_key_to_cpu(node, &cpukey, slot - 1);
388 btrfs_node_key(node, &node_key, slot);
389 BUG_ON(comp_keys(&node_key, &cpukey) <= 0);
Chris Mason8d7be552007-05-10 11:24:42 -0400390 }
391 if (slot < nritems - 1) {
Chris Mason5f39d392007-10-15 16:14:19 -0400392 btrfs_node_key_to_cpu(node, &cpukey, slot + 1);
393 btrfs_node_key(node, &node_key, slot);
394 BUG_ON(comp_keys(&node_key, &cpukey) >= 0);
Chris Masonaa5d6be2007-02-28 16:35:06 -0500395 }
396 return 0;
397}
398
Chris Mason123abc82007-03-14 14:14:43 -0400399static int check_leaf(struct btrfs_root *root, struct btrfs_path *path,
400 int level)
Chris Masonaa5d6be2007-02-28 16:35:06 -0500401{
Chris Mason5f39d392007-10-15 16:14:19 -0400402 struct extent_buffer *leaf = path->nodes[level];
403 struct extent_buffer *parent = NULL;
Chris Masonaa5d6be2007-02-28 16:35:06 -0500404 int parent_slot;
Chris Mason8d7be552007-05-10 11:24:42 -0400405 struct btrfs_key cpukey;
Chris Mason5f39d392007-10-15 16:14:19 -0400406 struct btrfs_disk_key parent_key;
407 struct btrfs_disk_key leaf_key;
408 int slot = path->slots[0];
Chris Mason8d7be552007-05-10 11:24:42 -0400409
Chris Mason5f39d392007-10-15 16:14:19 -0400410 u32 nritems = btrfs_header_nritems(leaf);
Chris Masonaa5d6be2007-02-28 16:35:06 -0500411
412 if (path->nodes[level + 1])
Chris Mason5f39d392007-10-15 16:14:19 -0400413 parent = path->nodes[level + 1];
Chris Mason7518a232007-03-12 12:01:18 -0400414
415 if (nritems == 0)
416 return 0;
417
418 if (parent) {
Aneesha1f39632007-07-11 10:03:27 -0400419 parent_slot = path->slots[level + 1];
Chris Mason5f39d392007-10-15 16:14:19 -0400420 btrfs_node_key(parent, &parent_key, parent_slot);
421 btrfs_item_key(leaf, &leaf_key, 0);
Chris Mason6702ed42007-08-07 16:15:09 -0400422
Chris Mason5f39d392007-10-15 16:14:19 -0400423 BUG_ON(memcmp(&parent_key, &leaf_key,
Chris Masone2fa7222007-03-12 16:22:34 -0400424 sizeof(struct btrfs_disk_key)));
Chris Mason1d4f8a02007-03-13 09:28:32 -0400425 BUG_ON(btrfs_node_blockptr(parent, parent_slot) !=
Chris Masondb945352007-10-15 16:15:53 -0400426 btrfs_header_bytenr(leaf));
Chris Masonaa5d6be2007-02-28 16:35:06 -0500427 }
Chris Mason5f39d392007-10-15 16:14:19 -0400428#if 0
429 for (i = 0; nritems > 1 && i < nritems - 2; i++) {
430 btrfs_item_key_to_cpu(leaf, &cpukey, i + 1);
431 btrfs_item_key(leaf, &leaf_key, i);
432 if (comp_keys(&leaf_key, &cpukey) >= 0) {
433 btrfs_print_leaf(root, leaf);
434 printk("slot %d offset bad key\n", i);
435 BUG_ON(1);
436 }
437 if (btrfs_item_offset_nr(leaf, i) !=
438 btrfs_item_end_nr(leaf, i + 1)) {
439 btrfs_print_leaf(root, leaf);
440 printk("slot %d offset bad\n", i);
441 BUG_ON(1);
442 }
443 if (i == 0) {
444 if (btrfs_item_offset_nr(leaf, i) +
445 btrfs_item_size_nr(leaf, i) !=
446 BTRFS_LEAF_DATA_SIZE(root)) {
447 btrfs_print_leaf(root, leaf);
448 printk("slot %d first offset bad\n", i);
449 BUG_ON(1);
450 }
451 }
452 }
453 if (nritems > 0) {
454 if (btrfs_item_size_nr(leaf, nritems - 1) > 4096) {
455 btrfs_print_leaf(root, leaf);
456 printk("slot %d bad size \n", nritems - 1);
457 BUG_ON(1);
458 }
459 }
460#endif
461 if (slot != 0 && slot < nritems - 1) {
462 btrfs_item_key(leaf, &leaf_key, slot);
463 btrfs_item_key_to_cpu(leaf, &cpukey, slot - 1);
464 if (comp_keys(&leaf_key, &cpukey) <= 0) {
465 btrfs_print_leaf(root, leaf);
466 printk("slot %d offset bad key\n", slot);
467 BUG_ON(1);
468 }
469 if (btrfs_item_offset_nr(leaf, slot - 1) !=
470 btrfs_item_end_nr(leaf, slot)) {
471 btrfs_print_leaf(root, leaf);
472 printk("slot %d offset bad\n", slot);
473 BUG_ON(1);
474 }
Chris Masonaa5d6be2007-02-28 16:35:06 -0500475 }
Chris Mason8d7be552007-05-10 11:24:42 -0400476 if (slot < nritems - 1) {
Chris Mason5f39d392007-10-15 16:14:19 -0400477 btrfs_item_key(leaf, &leaf_key, slot);
478 btrfs_item_key_to_cpu(leaf, &cpukey, slot + 1);
479 BUG_ON(comp_keys(&leaf_key, &cpukey) >= 0);
480 if (btrfs_item_offset_nr(leaf, slot) !=
481 btrfs_item_end_nr(leaf, slot + 1)) {
482 btrfs_print_leaf(root, leaf);
483 printk("slot %d offset bad\n", slot);
484 BUG_ON(1);
485 }
Chris Mason8d7be552007-05-10 11:24:42 -0400486 }
Chris Mason5f39d392007-10-15 16:14:19 -0400487 BUG_ON(btrfs_item_offset_nr(leaf, 0) +
488 btrfs_item_size_nr(leaf, 0) != BTRFS_LEAF_DATA_SIZE(root));
Chris Masonaa5d6be2007-02-28 16:35:06 -0500489 return 0;
490}
491
/*
 * consistency check hook for the block at path->nodes[level].
 *
 * The checks are currently switched off: the function returns 0 before
 * doing anything.  The code after the return is never executed; it
 * keeps check_leaf and check_node referenced.
 */
static int check_block(struct btrfs_root *root, struct btrfs_path *path,
		       int level)
{
	return 0;
#if 0
	struct extent_buffer *buf = path->nodes[level];

	if (memcmp_extent_buffer(buf, root->fs_info->fsid,
				 (unsigned long)btrfs_header_fsid(buf),
				 BTRFS_FSID_SIZE)) {
		printk("warning bad block %Lu\n", buf->start);
		return 1;
	}
#endif
	return level == 0 ? check_leaf(root, path, level) :
			    check_node(root, path, level);
}
510
Chris Mason74123bd2007-02-02 11:05:29 -0500511/*
Chris Mason5f39d392007-10-15 16:14:19 -0400512 * search for key in the extent_buffer. The items start at offset p,
513 * and they are item_size apart. There are 'max' items in p.
514 *
Chris Mason74123bd2007-02-02 11:05:29 -0500515 * the slot in the array is returned via slot, and it points to
516 * the place where you would insert key if it is not found in
517 * the array.
518 *
519 * slot may point to max if the key is bigger than all of the keys
520 */
Chris Mason5f39d392007-10-15 16:14:19 -0400521static int generic_bin_search(struct extent_buffer *eb, unsigned long p,
522 int item_size, struct btrfs_key *key,
523 int max, int *slot)
Chris Masonbe0e5c02007-01-26 15:51:26 -0500524{
525 int low = 0;
526 int high = max;
527 int mid;
528 int ret;
Chris Mason479965d2007-10-15 16:14:27 -0400529 struct btrfs_disk_key *tmp = NULL;
Chris Mason5f39d392007-10-15 16:14:19 -0400530 struct btrfs_disk_key unaligned;
531 unsigned long offset;
532 char *map_token = NULL;
533 char *kaddr = NULL;
534 unsigned long map_start = 0;
535 unsigned long map_len = 0;
Chris Mason479965d2007-10-15 16:14:27 -0400536 int err;
Chris Masonbe0e5c02007-01-26 15:51:26 -0500537
538 while(low < high) {
539 mid = (low + high) / 2;
Chris Mason5f39d392007-10-15 16:14:19 -0400540 offset = p + mid * item_size;
541
542 if (!map_token || offset < map_start ||
543 (offset + sizeof(struct btrfs_disk_key)) >
544 map_start + map_len) {
Chris Mason479965d2007-10-15 16:14:27 -0400545 if (map_token) {
Chris Mason5f39d392007-10-15 16:14:19 -0400546 unmap_extent_buffer(eb, map_token, KM_USER0);
Chris Mason479965d2007-10-15 16:14:27 -0400547 map_token = NULL;
548 }
549 err = map_extent_buffer(eb, offset,
550 sizeof(struct btrfs_disk_key),
551 &map_token, &kaddr,
552 &map_start, &map_len, KM_USER0);
Chris Mason5f39d392007-10-15 16:14:19 -0400553
Chris Mason479965d2007-10-15 16:14:27 -0400554 if (!err) {
555 tmp = (struct btrfs_disk_key *)(kaddr + offset -
556 map_start);
557 } else {
558 read_extent_buffer(eb, &unaligned,
559 offset, sizeof(unaligned));
560 tmp = &unaligned;
561 }
562
Chris Mason5f39d392007-10-15 16:14:19 -0400563 } else {
564 tmp = (struct btrfs_disk_key *)(kaddr + offset -
565 map_start);
566 }
Chris Masonbe0e5c02007-01-26 15:51:26 -0500567 ret = comp_keys(tmp, key);
568
569 if (ret < 0)
570 low = mid + 1;
571 else if (ret > 0)
572 high = mid;
573 else {
574 *slot = mid;
Chris Mason479965d2007-10-15 16:14:27 -0400575 if (map_token)
576 unmap_extent_buffer(eb, map_token, KM_USER0);
Chris Masonbe0e5c02007-01-26 15:51:26 -0500577 return 0;
578 }
579 }
580 *slot = low;
Chris Mason5f39d392007-10-15 16:14:19 -0400581 if (map_token)
582 unmap_extent_buffer(eb, map_token, KM_USER0);
Chris Masonbe0e5c02007-01-26 15:51:26 -0500583 return 1;
584}
585
Chris Mason97571fd2007-02-24 13:39:08 -0500586/*
587 * simple bin_search frontend that does the right thing for
588 * leaves vs nodes
589 */
Chris Mason5f39d392007-10-15 16:14:19 -0400590static int bin_search(struct extent_buffer *eb, struct btrfs_key *key,
591 int level, int *slot)
Chris Masonbe0e5c02007-01-26 15:51:26 -0500592{
Chris Mason5f39d392007-10-15 16:14:19 -0400593 if (level == 0) {
594 return generic_bin_search(eb,
595 offsetof(struct btrfs_leaf, items),
Chris Mason0783fcf2007-03-12 20:12:07 -0400596 sizeof(struct btrfs_item),
Chris Mason5f39d392007-10-15 16:14:19 -0400597 key, btrfs_header_nritems(eb),
Chris Mason7518a232007-03-12 12:01:18 -0400598 slot);
Chris Masonbe0e5c02007-01-26 15:51:26 -0500599 } else {
Chris Mason5f39d392007-10-15 16:14:19 -0400600 return generic_bin_search(eb,
601 offsetof(struct btrfs_node, ptrs),
Chris Mason123abc82007-03-14 14:14:43 -0400602 sizeof(struct btrfs_key_ptr),
Chris Mason5f39d392007-10-15 16:14:19 -0400603 key, btrfs_header_nritems(eb),
Chris Mason7518a232007-03-12 12:01:18 -0400604 slot);
Chris Masonbe0e5c02007-01-26 15:51:26 -0500605 }
606 return -1;
607}
608
Chris Mason5f39d392007-10-15 16:14:19 -0400609static struct extent_buffer *read_node_slot(struct btrfs_root *root,
610 struct extent_buffer *parent, int slot)
Chris Masonbb803952007-03-01 12:04:21 -0500611{
Chris Masonbb803952007-03-01 12:04:21 -0500612 if (slot < 0)
613 return NULL;
Chris Mason5f39d392007-10-15 16:14:19 -0400614 if (slot >= btrfs_header_nritems(parent))
Chris Masonbb803952007-03-01 12:04:21 -0500615 return NULL;
Chris Masondb945352007-10-15 16:15:53 -0400616 return read_tree_block(root, btrfs_node_blockptr(parent, slot),
617 btrfs_level_size(root, btrfs_header_level(parent) - 1));
Chris Masonbb803952007-03-01 12:04:21 -0500618}
619
Chris Masone089f052007-03-16 16:20:31 -0400620static int balance_level(struct btrfs_trans_handle *trans, struct btrfs_root
621 *root, struct btrfs_path *path, int level)
Chris Masonbb803952007-03-01 12:04:21 -0500622{
Chris Mason5f39d392007-10-15 16:14:19 -0400623 struct extent_buffer *right = NULL;
624 struct extent_buffer *mid;
625 struct extent_buffer *left = NULL;
626 struct extent_buffer *parent = NULL;
Chris Masonbb803952007-03-01 12:04:21 -0500627 int ret = 0;
628 int wret;
629 int pslot;
Chris Masonbb803952007-03-01 12:04:21 -0500630 int orig_slot = path->slots[level];
Chris Mason54aa1f42007-06-22 14:16:25 -0400631 int err_on_enospc = 0;
Chris Mason79f95c82007-03-01 15:16:26 -0500632 u64 orig_ptr;
Chris Masonbb803952007-03-01 12:04:21 -0500633
634 if (level == 0)
635 return 0;
636
Chris Mason5f39d392007-10-15 16:14:19 -0400637 mid = path->nodes[level];
Chris Mason7bb86312007-12-11 09:25:06 -0500638 WARN_ON(btrfs_header_generation(mid) != trans->transid);
639
Chris Mason1d4f8a02007-03-13 09:28:32 -0400640 orig_ptr = btrfs_node_blockptr(mid, orig_slot);
Chris Mason79f95c82007-03-01 15:16:26 -0500641
Chris Mason234b63a2007-03-13 10:46:10 -0400642 if (level < BTRFS_MAX_LEVEL - 1)
Chris Mason5f39d392007-10-15 16:14:19 -0400643 parent = path->nodes[level + 1];
Chris Masonbb803952007-03-01 12:04:21 -0500644 pslot = path->slots[level + 1];
645
Chris Mason40689472007-03-17 14:29:23 -0400646 /*
647 * deal with the case where there is only one pointer in the root
648 * by promoting the node below to a root
649 */
Chris Mason5f39d392007-10-15 16:14:19 -0400650 if (!parent) {
651 struct extent_buffer *child;
Chris Masonbb803952007-03-01 12:04:21 -0500652
Chris Mason5f39d392007-10-15 16:14:19 -0400653 if (btrfs_header_nritems(mid) != 1)
Chris Masonbb803952007-03-01 12:04:21 -0500654 return 0;
655
656 /* promote the child to a root */
Chris Mason5f39d392007-10-15 16:14:19 -0400657 child = read_node_slot(root, mid, 0);
Chris Masonbb803952007-03-01 12:04:21 -0500658 BUG_ON(!child);
659 root->node = child;
660 path->nodes[level] = NULL;
Chris Mason5f39d392007-10-15 16:14:19 -0400661 clean_tree_block(trans, root, mid);
662 wait_on_tree_block_writeback(root, mid);
Chris Masonbb803952007-03-01 12:04:21 -0500663 /* once for the path */
Chris Mason5f39d392007-10-15 16:14:19 -0400664 free_extent_buffer(mid);
Chris Mason7bb86312007-12-11 09:25:06 -0500665 ret = btrfs_free_extent(trans, root, mid->start, mid->len,
666 root->root_key.objectid,
667 btrfs_header_generation(mid), 0, 0, 1);
Chris Masonbb803952007-03-01 12:04:21 -0500668 /* once for the root ptr */
Chris Mason5f39d392007-10-15 16:14:19 -0400669 free_extent_buffer(mid);
Chris Masondb945352007-10-15 16:15:53 -0400670 return ret;
Chris Masonbb803952007-03-01 12:04:21 -0500671 }
Chris Mason5f39d392007-10-15 16:14:19 -0400672 if (btrfs_header_nritems(mid) >
Chris Mason123abc82007-03-14 14:14:43 -0400673 BTRFS_NODEPTRS_PER_BLOCK(root) / 4)
Chris Masonbb803952007-03-01 12:04:21 -0500674 return 0;
675
Chris Mason5f39d392007-10-15 16:14:19 -0400676 if (btrfs_header_nritems(mid) < 2)
Chris Mason54aa1f42007-06-22 14:16:25 -0400677 err_on_enospc = 1;
678
Chris Mason5f39d392007-10-15 16:14:19 -0400679 left = read_node_slot(root, parent, pslot - 1);
680 if (left) {
681 wret = btrfs_cow_block(trans, root, left,
682 parent, pslot - 1, &left);
Chris Mason54aa1f42007-06-22 14:16:25 -0400683 if (wret) {
684 ret = wret;
685 goto enospc;
686 }
Chris Mason2cc58cf2007-08-27 16:49:44 -0400687 }
Chris Mason5f39d392007-10-15 16:14:19 -0400688 right = read_node_slot(root, parent, pslot + 1);
689 if (right) {
690 wret = btrfs_cow_block(trans, root, right,
691 parent, pslot + 1, &right);
Chris Mason2cc58cf2007-08-27 16:49:44 -0400692 if (wret) {
693 ret = wret;
694 goto enospc;
695 }
696 }
697
698 /* first, try to make some room in the middle buffer */
Chris Mason5f39d392007-10-15 16:14:19 -0400699 if (left) {
700 orig_slot += btrfs_header_nritems(left);
701 wret = push_node_left(trans, root, left, mid);
Chris Mason79f95c82007-03-01 15:16:26 -0500702 if (wret < 0)
703 ret = wret;
Chris Mason5f39d392007-10-15 16:14:19 -0400704 if (btrfs_header_nritems(mid) < 2)
Chris Mason54aa1f42007-06-22 14:16:25 -0400705 err_on_enospc = 1;
Chris Masonbb803952007-03-01 12:04:21 -0500706 }
Chris Mason79f95c82007-03-01 15:16:26 -0500707
708 /*
709 * then try to empty the right most buffer into the middle
710 */
Chris Mason5f39d392007-10-15 16:14:19 -0400711 if (right) {
712 wret = push_node_left(trans, root, mid, right);
Chris Mason54aa1f42007-06-22 14:16:25 -0400713 if (wret < 0 && wret != -ENOSPC)
Chris Mason79f95c82007-03-01 15:16:26 -0500714 ret = wret;
Chris Mason5f39d392007-10-15 16:14:19 -0400715 if (btrfs_header_nritems(right) == 0) {
Chris Masondb945352007-10-15 16:15:53 -0400716 u64 bytenr = right->start;
Chris Mason7bb86312007-12-11 09:25:06 -0500717 u64 generation = btrfs_header_generation(parent);
Chris Masondb945352007-10-15 16:15:53 -0400718 u32 blocksize = right->len;
719
Chris Mason5f39d392007-10-15 16:14:19 -0400720 clean_tree_block(trans, root, right);
721 wait_on_tree_block_writeback(root, right);
722 free_extent_buffer(right);
Chris Masonbb803952007-03-01 12:04:21 -0500723 right = NULL;
Chris Masone089f052007-03-16 16:20:31 -0400724 wret = del_ptr(trans, root, path, level + 1, pslot +
725 1);
Chris Masonbb803952007-03-01 12:04:21 -0500726 if (wret)
727 ret = wret;
Chris Masondb945352007-10-15 16:15:53 -0400728 wret = btrfs_free_extent(trans, root, bytenr,
Chris Mason7bb86312007-12-11 09:25:06 -0500729 blocksize,
730 btrfs_header_owner(parent),
731 generation, 0, 0, 1);
Chris Masonbb803952007-03-01 12:04:21 -0500732 if (wret)
733 ret = wret;
734 } else {
Chris Mason5f39d392007-10-15 16:14:19 -0400735 struct btrfs_disk_key right_key;
736 btrfs_node_key(right, &right_key, 0);
737 btrfs_set_node_key(parent, &right_key, pslot + 1);
738 btrfs_mark_buffer_dirty(parent);
Chris Masonbb803952007-03-01 12:04:21 -0500739 }
740 }
Chris Mason5f39d392007-10-15 16:14:19 -0400741 if (btrfs_header_nritems(mid) == 1) {
Chris Mason79f95c82007-03-01 15:16:26 -0500742 /*
743 * we're not allowed to leave a node with one item in the
744 * tree during a delete. A deletion from lower in the tree
745 * could try to delete the only pointer in this node.
746 * So, pull some keys from the left.
747 * There has to be a left pointer at this point because
748 * otherwise we would have pulled some pointers from the
749 * right
750 */
Chris Mason5f39d392007-10-15 16:14:19 -0400751 BUG_ON(!left);
752 wret = balance_node_right(trans, root, mid, left);
Chris Mason54aa1f42007-06-22 14:16:25 -0400753 if (wret < 0) {
Chris Mason79f95c82007-03-01 15:16:26 -0500754 ret = wret;
Chris Mason54aa1f42007-06-22 14:16:25 -0400755 goto enospc;
756 }
Chris Mason79f95c82007-03-01 15:16:26 -0500757 BUG_ON(wret == 1);
758 }
Chris Mason5f39d392007-10-15 16:14:19 -0400759 if (btrfs_header_nritems(mid) == 0) {
Chris Mason79f95c82007-03-01 15:16:26 -0500760 /* we've managed to empty the middle node, drop it */
Chris Mason7bb86312007-12-11 09:25:06 -0500761 u64 root_gen = btrfs_header_generation(parent);
Chris Masondb945352007-10-15 16:15:53 -0400762 u64 bytenr = mid->start;
763 u32 blocksize = mid->len;
Chris Mason5f39d392007-10-15 16:14:19 -0400764 clean_tree_block(trans, root, mid);
765 wait_on_tree_block_writeback(root, mid);
766 free_extent_buffer(mid);
Chris Masonbb803952007-03-01 12:04:21 -0500767 mid = NULL;
Chris Masone089f052007-03-16 16:20:31 -0400768 wret = del_ptr(trans, root, path, level + 1, pslot);
Chris Masonbb803952007-03-01 12:04:21 -0500769 if (wret)
770 ret = wret;
Chris Mason7bb86312007-12-11 09:25:06 -0500771 wret = btrfs_free_extent(trans, root, bytenr, blocksize,
772 btrfs_header_owner(parent),
773 root_gen, 0, 0, 1);
Chris Masonbb803952007-03-01 12:04:21 -0500774 if (wret)
775 ret = wret;
Chris Mason79f95c82007-03-01 15:16:26 -0500776 } else {
777 /* update the parent key to reflect our changes */
Chris Mason5f39d392007-10-15 16:14:19 -0400778 struct btrfs_disk_key mid_key;
779 btrfs_node_key(mid, &mid_key, 0);
780 btrfs_set_node_key(parent, &mid_key, pslot);
781 btrfs_mark_buffer_dirty(parent);
Chris Mason79f95c82007-03-01 15:16:26 -0500782 }
Chris Masonbb803952007-03-01 12:04:21 -0500783
Chris Mason79f95c82007-03-01 15:16:26 -0500784 /* update the path */
Chris Mason5f39d392007-10-15 16:14:19 -0400785 if (left) {
786 if (btrfs_header_nritems(left) > orig_slot) {
787 extent_buffer_get(left);
788 path->nodes[level] = left;
Chris Masonbb803952007-03-01 12:04:21 -0500789 path->slots[level + 1] -= 1;
790 path->slots[level] = orig_slot;
Chris Mason5f39d392007-10-15 16:14:19 -0400791 if (mid)
792 free_extent_buffer(mid);
Chris Masonbb803952007-03-01 12:04:21 -0500793 } else {
Chris Mason5f39d392007-10-15 16:14:19 -0400794 orig_slot -= btrfs_header_nritems(left);
Chris Masonbb803952007-03-01 12:04:21 -0500795 path->slots[level] = orig_slot;
796 }
797 }
Chris Mason79f95c82007-03-01 15:16:26 -0500798 /* double check we haven't messed things up */
Chris Mason123abc82007-03-14 14:14:43 -0400799 check_block(root, path, level);
Chris Masone20d96d2007-03-22 12:13:20 -0400800 if (orig_ptr !=
Chris Mason5f39d392007-10-15 16:14:19 -0400801 btrfs_node_blockptr(path->nodes[level], path->slots[level]))
Chris Mason79f95c82007-03-01 15:16:26 -0500802 BUG();
Chris Mason54aa1f42007-06-22 14:16:25 -0400803enospc:
Chris Mason5f39d392007-10-15 16:14:19 -0400804 if (right)
805 free_extent_buffer(right);
806 if (left)
807 free_extent_buffer(left);
Chris Masonbb803952007-03-01 12:04:21 -0500808 return ret;
809}
810
Chris Masone66f7092007-04-20 13:16:02 -0400811/* returns zero if the push worked, non-zero otherwise */
812static int push_nodes_for_insert(struct btrfs_trans_handle *trans,
813 struct btrfs_root *root,
814 struct btrfs_path *path, int level)
815{
Chris Mason5f39d392007-10-15 16:14:19 -0400816 struct extent_buffer *right = NULL;
817 struct extent_buffer *mid;
818 struct extent_buffer *left = NULL;
819 struct extent_buffer *parent = NULL;
Chris Masone66f7092007-04-20 13:16:02 -0400820 int ret = 0;
821 int wret;
822 int pslot;
823 int orig_slot = path->slots[level];
824 u64 orig_ptr;
825
826 if (level == 0)
827 return 1;
828
Chris Mason5f39d392007-10-15 16:14:19 -0400829 mid = path->nodes[level];
Chris Mason7bb86312007-12-11 09:25:06 -0500830 WARN_ON(btrfs_header_generation(mid) != trans->transid);
Chris Masone66f7092007-04-20 13:16:02 -0400831 orig_ptr = btrfs_node_blockptr(mid, orig_slot);
832
833 if (level < BTRFS_MAX_LEVEL - 1)
Chris Mason5f39d392007-10-15 16:14:19 -0400834 parent = path->nodes[level + 1];
Chris Masone66f7092007-04-20 13:16:02 -0400835 pslot = path->slots[level + 1];
836
Chris Mason5f39d392007-10-15 16:14:19 -0400837 if (!parent)
Chris Masone66f7092007-04-20 13:16:02 -0400838 return 1;
Chris Masone66f7092007-04-20 13:16:02 -0400839
Chris Mason5f39d392007-10-15 16:14:19 -0400840 left = read_node_slot(root, parent, pslot - 1);
Chris Masone66f7092007-04-20 13:16:02 -0400841
842 /* first, try to make some room in the middle buffer */
Chris Mason5f39d392007-10-15 16:14:19 -0400843 if (left) {
Chris Masone66f7092007-04-20 13:16:02 -0400844 u32 left_nr;
Chris Mason5f39d392007-10-15 16:14:19 -0400845 left_nr = btrfs_header_nritems(left);
Chris Mason33ade1f2007-04-20 13:48:57 -0400846 if (left_nr >= BTRFS_NODEPTRS_PER_BLOCK(root) - 1) {
847 wret = 1;
848 } else {
Chris Mason5f39d392007-10-15 16:14:19 -0400849 ret = btrfs_cow_block(trans, root, left, parent,
850 pslot - 1, &left);
Chris Mason54aa1f42007-06-22 14:16:25 -0400851 if (ret)
852 wret = 1;
853 else {
Chris Mason54aa1f42007-06-22 14:16:25 -0400854 wret = push_node_left(trans, root,
Chris Mason5f39d392007-10-15 16:14:19 -0400855 left, mid);
Chris Mason54aa1f42007-06-22 14:16:25 -0400856 }
Chris Mason33ade1f2007-04-20 13:48:57 -0400857 }
Chris Masone66f7092007-04-20 13:16:02 -0400858 if (wret < 0)
859 ret = wret;
860 if (wret == 0) {
Chris Mason5f39d392007-10-15 16:14:19 -0400861 struct btrfs_disk_key disk_key;
Chris Masone66f7092007-04-20 13:16:02 -0400862 orig_slot += left_nr;
Chris Mason5f39d392007-10-15 16:14:19 -0400863 btrfs_node_key(mid, &disk_key, 0);
864 btrfs_set_node_key(parent, &disk_key, pslot);
865 btrfs_mark_buffer_dirty(parent);
866 if (btrfs_header_nritems(left) > orig_slot) {
867 path->nodes[level] = left;
Chris Masone66f7092007-04-20 13:16:02 -0400868 path->slots[level + 1] -= 1;
869 path->slots[level] = orig_slot;
Chris Mason5f39d392007-10-15 16:14:19 -0400870 free_extent_buffer(mid);
Chris Masone66f7092007-04-20 13:16:02 -0400871 } else {
872 orig_slot -=
Chris Mason5f39d392007-10-15 16:14:19 -0400873 btrfs_header_nritems(left);
Chris Masone66f7092007-04-20 13:16:02 -0400874 path->slots[level] = orig_slot;
Chris Mason5f39d392007-10-15 16:14:19 -0400875 free_extent_buffer(left);
Chris Masone66f7092007-04-20 13:16:02 -0400876 }
Chris Masone66f7092007-04-20 13:16:02 -0400877 return 0;
878 }
Chris Mason5f39d392007-10-15 16:14:19 -0400879 free_extent_buffer(left);
Chris Masone66f7092007-04-20 13:16:02 -0400880 }
Chris Mason5f39d392007-10-15 16:14:19 -0400881 right= read_node_slot(root, parent, pslot + 1);
Chris Masone66f7092007-04-20 13:16:02 -0400882
883 /*
884 * then try to empty the right most buffer into the middle
885 */
Chris Mason5f39d392007-10-15 16:14:19 -0400886 if (right) {
Chris Mason33ade1f2007-04-20 13:48:57 -0400887 u32 right_nr;
Chris Mason5f39d392007-10-15 16:14:19 -0400888 right_nr = btrfs_header_nritems(right);
Chris Mason33ade1f2007-04-20 13:48:57 -0400889 if (right_nr >= BTRFS_NODEPTRS_PER_BLOCK(root) - 1) {
890 wret = 1;
891 } else {
Chris Mason5f39d392007-10-15 16:14:19 -0400892 ret = btrfs_cow_block(trans, root, right,
893 parent, pslot + 1,
894 &right);
Chris Mason54aa1f42007-06-22 14:16:25 -0400895 if (ret)
896 wret = 1;
897 else {
Chris Mason54aa1f42007-06-22 14:16:25 -0400898 wret = balance_node_right(trans, root,
Chris Mason5f39d392007-10-15 16:14:19 -0400899 right, mid);
Chris Mason54aa1f42007-06-22 14:16:25 -0400900 }
Chris Mason33ade1f2007-04-20 13:48:57 -0400901 }
Chris Masone66f7092007-04-20 13:16:02 -0400902 if (wret < 0)
903 ret = wret;
904 if (wret == 0) {
Chris Mason5f39d392007-10-15 16:14:19 -0400905 struct btrfs_disk_key disk_key;
906
907 btrfs_node_key(right, &disk_key, 0);
908 btrfs_set_node_key(parent, &disk_key, pslot + 1);
909 btrfs_mark_buffer_dirty(parent);
910
911 if (btrfs_header_nritems(mid) <= orig_slot) {
912 path->nodes[level] = right;
Chris Masone66f7092007-04-20 13:16:02 -0400913 path->slots[level + 1] += 1;
914 path->slots[level] = orig_slot -
Chris Mason5f39d392007-10-15 16:14:19 -0400915 btrfs_header_nritems(mid);
916 free_extent_buffer(mid);
Chris Masone66f7092007-04-20 13:16:02 -0400917 } else {
Chris Mason5f39d392007-10-15 16:14:19 -0400918 free_extent_buffer(right);
Chris Masone66f7092007-04-20 13:16:02 -0400919 }
Chris Masone66f7092007-04-20 13:16:02 -0400920 return 0;
921 }
Chris Mason5f39d392007-10-15 16:14:19 -0400922 free_extent_buffer(right);
Chris Masone66f7092007-04-20 13:16:02 -0400923 }
Chris Masone66f7092007-04-20 13:16:02 -0400924 return 1;
925}
926
Chris Mason74123bd2007-02-02 11:05:29 -0500927/*
Chris Mason3c69fae2007-08-07 15:52:22 -0400928 * readahead one full node of leaves
929 */
930static void reada_for_search(struct btrfs_root *root, struct btrfs_path *path,
Chris Mason6702ed42007-08-07 16:15:09 -0400931 int level, int slot)
Chris Mason3c69fae2007-08-07 15:52:22 -0400932{
Chris Mason5f39d392007-10-15 16:14:19 -0400933 struct extent_buffer *node;
Chris Mason3c69fae2007-08-07 15:52:22 -0400934 u32 nritems;
Chris Mason3c69fae2007-08-07 15:52:22 -0400935 u64 search;
Chris Mason6b800532007-10-15 16:17:34 -0400936 u64 lowest_read;
937 u64 highest_read;
938 u64 nread = 0;
Chris Mason3c69fae2007-08-07 15:52:22 -0400939 int direction = path->reada;
Chris Mason5f39d392007-10-15 16:14:19 -0400940 struct extent_buffer *eb;
Chris Mason6b800532007-10-15 16:17:34 -0400941 u32 nr;
942 u32 blocksize;
943 u32 nscan = 0;
Chris Masondb945352007-10-15 16:15:53 -0400944
Chris Masona6b6e752007-10-15 16:22:39 -0400945 if (level != 1)
Chris Mason3c69fae2007-08-07 15:52:22 -0400946 return;
947
Chris Mason6702ed42007-08-07 16:15:09 -0400948 if (!path->nodes[level])
949 return;
950
Chris Mason5f39d392007-10-15 16:14:19 -0400951 node = path->nodes[level];
Chris Mason3c69fae2007-08-07 15:52:22 -0400952 search = btrfs_node_blockptr(node, slot);
Chris Mason6b800532007-10-15 16:17:34 -0400953 blocksize = btrfs_level_size(root, level - 1);
954 eb = btrfs_find_tree_block(root, search, blocksize);
Chris Mason5f39d392007-10-15 16:14:19 -0400955 if (eb) {
956 free_extent_buffer(eb);
Chris Mason3c69fae2007-08-07 15:52:22 -0400957 return;
958 }
959
Chris Mason6b800532007-10-15 16:17:34 -0400960 highest_read = search;
961 lowest_read = search;
962
Chris Mason5f39d392007-10-15 16:14:19 -0400963 nritems = btrfs_header_nritems(node);
Chris Mason6b800532007-10-15 16:17:34 -0400964 nr = slot;
Chris Mason3c69fae2007-08-07 15:52:22 -0400965 while(1) {
Chris Mason6b800532007-10-15 16:17:34 -0400966 if (direction < 0) {
967 if (nr == 0)
968 break;
969 nr--;
970 } else if (direction > 0) {
971 nr++;
972 if (nr >= nritems)
973 break;
Chris Mason3c69fae2007-08-07 15:52:22 -0400974 }
Chris Mason6b800532007-10-15 16:17:34 -0400975 search = btrfs_node_blockptr(node, nr);
976 if ((search >= lowest_read && search <= highest_read) ||
977 (search < lowest_read && lowest_read - search <= 32768) ||
978 (search > highest_read && search - highest_read <= 32768)) {
979 readahead_tree_block(root, search, blocksize);
980 nread += blocksize;
981 }
982 nscan++;
983 if (path->reada < 2 && (nread > (256 * 1024) || nscan > 32))
984 break;
985 if(nread > (1024 * 1024) || nscan > 128)
986 break;
987
988 if (search < lowest_read)
989 lowest_read = search;
990 if (search > highest_read)
991 highest_read = search;
Chris Mason3c69fae2007-08-07 15:52:22 -0400992 }
993}
994/*
Chris Mason74123bd2007-02-02 11:05:29 -0500995 * look for key in the tree. path is filled in with nodes along the way
996 * if key is found, we return zero and you can find the item in the leaf
997 * level of the path (level 0)
998 *
999 * If the key isn't found, the path points to the slot where it should
Chris Masonaa5d6be2007-02-28 16:35:06 -05001000 * be inserted, and 1 is returned. If there are other errors during the
1001 * search a negative error number is returned.
Chris Mason97571fd2007-02-24 13:39:08 -05001002 *
1003 * if ins_len > 0, nodes and leaves will be split as we walk down the
1004 * tree. if ins_len < 0, nodes will be merged as we walk down the tree (if
1005 * possible)
Chris Mason74123bd2007-02-02 11:05:29 -05001006 */
Chris Masone089f052007-03-16 16:20:31 -04001007int btrfs_search_slot(struct btrfs_trans_handle *trans, struct btrfs_root
1008 *root, struct btrfs_key *key, struct btrfs_path *p, int
1009 ins_len, int cow)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001010{
Chris Mason5f39d392007-10-15 16:14:19 -04001011 struct extent_buffer *b;
Chris Masondb945352007-10-15 16:15:53 -04001012 u64 bytenr;
Chris Mason74493f72007-12-11 09:25:06 -05001013 u64 ptr_gen;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001014 int slot;
1015 int ret;
1016 int level;
Chris Mason3c69fae2007-08-07 15:52:22 -04001017 int should_reada = p->reada;
Chris Mason9f3a7422007-08-07 15:52:19 -04001018 u8 lowest_level = 0;
1019
Chris Mason6702ed42007-08-07 16:15:09 -04001020 lowest_level = p->lowest_level;
1021 WARN_ON(lowest_level && ins_len);
Chris Mason22b0ebd2007-03-30 08:47:31 -04001022 WARN_ON(p->nodes[0] != NULL);
1023 WARN_ON(!mutex_is_locked(&root->fs_info->fs_mutex));
Chris Masonbb803952007-03-01 12:04:21 -05001024again:
1025 b = root->node;
Chris Mason5f39d392007-10-15 16:14:19 -04001026 extent_buffer_get(b);
Chris Masoneb60cea2007-02-02 09:18:22 -05001027 while (b) {
Chris Mason5f39d392007-10-15 16:14:19 -04001028 level = btrfs_header_level(b);
Chris Mason02217ed2007-03-02 16:08:05 -05001029 if (cow) {
1030 int wret;
Chris Masone20d96d2007-03-22 12:13:20 -04001031 wret = btrfs_cow_block(trans, root, b,
1032 p->nodes[level + 1],
1033 p->slots[level + 1],
Yan252c38f2007-08-29 09:11:44 -04001034 &b);
Chris Mason54aa1f42007-06-22 14:16:25 -04001035 if (wret) {
Chris Mason5f39d392007-10-15 16:14:19 -04001036 free_extent_buffer(b);
Chris Mason54aa1f42007-06-22 14:16:25 -04001037 return wret;
1038 }
Chris Mason02217ed2007-03-02 16:08:05 -05001039 }
1040 BUG_ON(!cow && ins_len);
Chris Mason5f39d392007-10-15 16:14:19 -04001041 if (level != btrfs_header_level(b))
Chris Mason2c90e5d2007-04-02 10:50:19 -04001042 WARN_ON(1);
Chris Mason5f39d392007-10-15 16:14:19 -04001043 level = btrfs_header_level(b);
Chris Masoneb60cea2007-02-02 09:18:22 -05001044 p->nodes[level] = b;
Chris Mason123abc82007-03-14 14:14:43 -04001045 ret = check_block(root, p, level);
Chris Masonaa5d6be2007-02-28 16:35:06 -05001046 if (ret)
1047 return -1;
Chris Mason5f39d392007-10-15 16:14:19 -04001048 ret = bin_search(b, key, level, &slot);
1049 if (level != 0) {
Chris Masonbe0e5c02007-01-26 15:51:26 -05001050 if (ret && slot > 0)
1051 slot -= 1;
1052 p->slots[level] = slot;
Chris Mason5f39d392007-10-15 16:14:19 -04001053 if (ins_len > 0 && btrfs_header_nritems(b) >=
Chris Masond4dbff92007-04-04 14:08:15 -04001054 BTRFS_NODEPTRS_PER_BLOCK(root) - 1) {
Chris Masone089f052007-03-16 16:20:31 -04001055 int sret = split_node(trans, root, p, level);
Chris Mason5c680ed2007-02-22 11:39:13 -05001056 BUG_ON(sret > 0);
1057 if (sret)
1058 return sret;
1059 b = p->nodes[level];
Chris Mason5c680ed2007-02-22 11:39:13 -05001060 slot = p->slots[level];
Chris Masonbb803952007-03-01 12:04:21 -05001061 } else if (ins_len < 0) {
Chris Masone089f052007-03-16 16:20:31 -04001062 int sret = balance_level(trans, root, p,
1063 level);
Chris Masonbb803952007-03-01 12:04:21 -05001064 if (sret)
1065 return sret;
1066 b = p->nodes[level];
Chris Masonf510cfe2007-10-15 16:14:48 -04001067 if (!b) {
1068 btrfs_release_path(NULL, p);
Chris Masonbb803952007-03-01 12:04:21 -05001069 goto again;
Chris Masonf510cfe2007-10-15 16:14:48 -04001070 }
Chris Masonbb803952007-03-01 12:04:21 -05001071 slot = p->slots[level];
Chris Mason5f39d392007-10-15 16:14:19 -04001072 BUG_ON(btrfs_header_nritems(b) == 1);
Chris Mason5c680ed2007-02-22 11:39:13 -05001073 }
Chris Mason9f3a7422007-08-07 15:52:19 -04001074 /* this is only true while dropping a snapshot */
1075 if (level == lowest_level)
1076 break;
Chris Masondb945352007-10-15 16:15:53 -04001077 bytenr = btrfs_node_blockptr(b, slot);
Chris Mason74493f72007-12-11 09:25:06 -05001078 ptr_gen = btrfs_node_ptr_generation(b, slot);
Chris Mason6702ed42007-08-07 16:15:09 -04001079 if (should_reada)
1080 reada_for_search(root, p, level, slot);
Chris Masondb945352007-10-15 16:15:53 -04001081 b = read_tree_block(root, bytenr,
1082 btrfs_level_size(root, level - 1));
Chris Mason74493f72007-12-11 09:25:06 -05001083 if (ptr_gen != btrfs_header_generation(b)) {
1084 printk("block %llu bad gen wanted %llu "
1085 "found %llu\n",
1086 (unsigned long long)b->start,
1087 (unsigned long long)ptr_gen,
1088 (unsigned long long)btrfs_header_generation(b));
1089 }
Chris Masonbe0e5c02007-01-26 15:51:26 -05001090 } else {
1091 p->slots[level] = slot;
Chris Mason5f39d392007-10-15 16:14:19 -04001092 if (ins_len > 0 && btrfs_leaf_free_space(root, b) <
Chris Mason0783fcf2007-03-12 20:12:07 -04001093 sizeof(struct btrfs_item) + ins_len) {
Chris Masond4dbff92007-04-04 14:08:15 -04001094 int sret = split_leaf(trans, root, key,
Chris Masoncc0c5532007-10-25 15:42:57 -04001095 p, ins_len, ret == 0);
Chris Mason5c680ed2007-02-22 11:39:13 -05001096 BUG_ON(sret > 0);
1097 if (sret)
1098 return sret;
1099 }
Chris Masonbe0e5c02007-01-26 15:51:26 -05001100 return ret;
1101 }
1102 }
Chris Masonaa5d6be2007-02-28 16:35:06 -05001103 return 1;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001104}
1105
Chris Mason74123bd2007-02-02 11:05:29 -05001106/*
1107 * adjust the pointers going up the tree, starting at level
1108 * making sure the right key of each node is points to 'key'.
1109 * This is used after shifting pointers to the left, so it stops
1110 * fixing up pointers when a given leaf/node is not in slot 0 of the
1111 * higher levels
Chris Masonaa5d6be2007-02-28 16:35:06 -05001112 *
1113 * If this fails to write a tree block, it returns -1, but continues
1114 * fixing up the blocks in ram so the tree is consistent.
Chris Mason74123bd2007-02-02 11:05:29 -05001115 */
Chris Mason5f39d392007-10-15 16:14:19 -04001116static int fixup_low_keys(struct btrfs_trans_handle *trans,
1117 struct btrfs_root *root, struct btrfs_path *path,
1118 struct btrfs_disk_key *key, int level)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001119{
1120 int i;
Chris Masonaa5d6be2007-02-28 16:35:06 -05001121 int ret = 0;
Chris Mason5f39d392007-10-15 16:14:19 -04001122 struct extent_buffer *t;
1123
Chris Mason234b63a2007-03-13 10:46:10 -04001124 for (i = level; i < BTRFS_MAX_LEVEL; i++) {
Chris Masonbe0e5c02007-01-26 15:51:26 -05001125 int tslot = path->slots[i];
Chris Masoneb60cea2007-02-02 09:18:22 -05001126 if (!path->nodes[i])
Chris Masonbe0e5c02007-01-26 15:51:26 -05001127 break;
Chris Mason5f39d392007-10-15 16:14:19 -04001128 t = path->nodes[i];
1129 btrfs_set_node_key(t, key, tslot);
Chris Masond6025572007-03-30 14:27:56 -04001130 btrfs_mark_buffer_dirty(path->nodes[i]);
Chris Masonbe0e5c02007-01-26 15:51:26 -05001131 if (tslot != 0)
1132 break;
1133 }
Chris Masonaa5d6be2007-02-28 16:35:06 -05001134 return ret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001135}
1136
Chris Mason74123bd2007-02-02 11:05:29 -05001137/*
1138 * try to push data from one node into the next node left in the
Chris Mason79f95c82007-03-01 15:16:26 -05001139 * tree.
Chris Masonaa5d6be2007-02-28 16:35:06 -05001140 *
1141 * returns 0 if some ptrs were pushed left, < 0 if there was some horrible
1142 * error, and > 0 if there was no room in the left hand block.
Chris Mason74123bd2007-02-02 11:05:29 -05001143 */
Chris Masone089f052007-03-16 16:20:31 -04001144static int push_node_left(struct btrfs_trans_handle *trans, struct btrfs_root
Chris Mason5f39d392007-10-15 16:14:19 -04001145 *root, struct extent_buffer *dst,
1146 struct extent_buffer *src)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001147{
Chris Masonbe0e5c02007-01-26 15:51:26 -05001148 int push_items = 0;
Chris Masonbb803952007-03-01 12:04:21 -05001149 int src_nritems;
1150 int dst_nritems;
Chris Masonaa5d6be2007-02-28 16:35:06 -05001151 int ret = 0;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001152
Chris Mason5f39d392007-10-15 16:14:19 -04001153 src_nritems = btrfs_header_nritems(src);
1154 dst_nritems = btrfs_header_nritems(dst);
Chris Mason123abc82007-03-14 14:14:43 -04001155 push_items = BTRFS_NODEPTRS_PER_BLOCK(root) - dst_nritems;
Chris Mason7bb86312007-12-11 09:25:06 -05001156 WARN_ON(btrfs_header_generation(src) != trans->transid);
1157 WARN_ON(btrfs_header_generation(dst) != trans->transid);
Chris Mason54aa1f42007-06-22 14:16:25 -04001158
Chris Masoneb60cea2007-02-02 09:18:22 -05001159 if (push_items <= 0) {
Chris Masonbe0e5c02007-01-26 15:51:26 -05001160 return 1;
Chris Masoneb60cea2007-02-02 09:18:22 -05001161 }
Chris Masonbe0e5c02007-01-26 15:51:26 -05001162
1163 if (src_nritems < push_items)
Chris Mason79f95c82007-03-01 15:16:26 -05001164 push_items = src_nritems;
1165
Chris Mason5f39d392007-10-15 16:14:19 -04001166 copy_extent_buffer(dst, src,
1167 btrfs_node_key_ptr_offset(dst_nritems),
1168 btrfs_node_key_ptr_offset(0),
1169 push_items * sizeof(struct btrfs_key_ptr));
1170
Chris Masonbb803952007-03-01 12:04:21 -05001171 if (push_items < src_nritems) {
Chris Mason5f39d392007-10-15 16:14:19 -04001172 memmove_extent_buffer(src, btrfs_node_key_ptr_offset(0),
1173 btrfs_node_key_ptr_offset(push_items),
1174 (src_nritems - push_items) *
1175 sizeof(struct btrfs_key_ptr));
Chris Masonbb803952007-03-01 12:04:21 -05001176 }
Chris Mason5f39d392007-10-15 16:14:19 -04001177 btrfs_set_header_nritems(src, src_nritems - push_items);
1178 btrfs_set_header_nritems(dst, dst_nritems + push_items);
1179 btrfs_mark_buffer_dirty(src);
1180 btrfs_mark_buffer_dirty(dst);
Chris Masonbb803952007-03-01 12:04:21 -05001181 return ret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001182}
1183
Chris Mason97571fd2007-02-24 13:39:08 -05001184/*
Chris Mason79f95c82007-03-01 15:16:26 -05001185 * try to push data from one node into the next node right in the
1186 * tree.
1187 *
1188 * returns 0 if some ptrs were pushed, < 0 if there was some horrible
1189 * error, and > 0 if there was no room in the right hand block.
1190 *
1191 * this will only push up to 1/2 the contents of the left node over
1192 */
Chris Mason5f39d392007-10-15 16:14:19 -04001193static int balance_node_right(struct btrfs_trans_handle *trans,
1194 struct btrfs_root *root,
1195 struct extent_buffer *dst,
1196 struct extent_buffer *src)
Chris Mason79f95c82007-03-01 15:16:26 -05001197{
Chris Mason79f95c82007-03-01 15:16:26 -05001198 int push_items = 0;
1199 int max_push;
1200 int src_nritems;
1201 int dst_nritems;
1202 int ret = 0;
Chris Mason79f95c82007-03-01 15:16:26 -05001203
Chris Mason7bb86312007-12-11 09:25:06 -05001204 WARN_ON(btrfs_header_generation(src) != trans->transid);
1205 WARN_ON(btrfs_header_generation(dst) != trans->transid);
1206
Chris Mason5f39d392007-10-15 16:14:19 -04001207 src_nritems = btrfs_header_nritems(src);
1208 dst_nritems = btrfs_header_nritems(dst);
Chris Mason123abc82007-03-14 14:14:43 -04001209 push_items = BTRFS_NODEPTRS_PER_BLOCK(root) - dst_nritems;
Chris Mason5f39d392007-10-15 16:14:19 -04001210 if (push_items <= 0)
Chris Mason79f95c82007-03-01 15:16:26 -05001211 return 1;
Chris Mason79f95c82007-03-01 15:16:26 -05001212
1213 max_push = src_nritems / 2 + 1;
1214 /* don't try to empty the node */
Yan252c38f2007-08-29 09:11:44 -04001215 if (max_push >= src_nritems)
Chris Mason79f95c82007-03-01 15:16:26 -05001216 return 1;
Yan252c38f2007-08-29 09:11:44 -04001217
Chris Mason79f95c82007-03-01 15:16:26 -05001218 if (max_push < push_items)
1219 push_items = max_push;
1220
Chris Mason5f39d392007-10-15 16:14:19 -04001221 memmove_extent_buffer(dst, btrfs_node_key_ptr_offset(push_items),
1222 btrfs_node_key_ptr_offset(0),
1223 (dst_nritems) *
1224 sizeof(struct btrfs_key_ptr));
Chris Masond6025572007-03-30 14:27:56 -04001225
Chris Mason5f39d392007-10-15 16:14:19 -04001226 copy_extent_buffer(dst, src,
1227 btrfs_node_key_ptr_offset(0),
1228 btrfs_node_key_ptr_offset(src_nritems - push_items),
1229 push_items * sizeof(struct btrfs_key_ptr));
Chris Mason79f95c82007-03-01 15:16:26 -05001230
Chris Mason5f39d392007-10-15 16:14:19 -04001231 btrfs_set_header_nritems(src, src_nritems - push_items);
1232 btrfs_set_header_nritems(dst, dst_nritems + push_items);
Chris Mason79f95c82007-03-01 15:16:26 -05001233
Chris Mason5f39d392007-10-15 16:14:19 -04001234 btrfs_mark_buffer_dirty(src);
1235 btrfs_mark_buffer_dirty(dst);
Chris Mason79f95c82007-03-01 15:16:26 -05001236 return ret;
1237}
1238
1239/*
Chris Mason97571fd2007-02-24 13:39:08 -05001240 * helper function to insert a new root level in the tree.
1241 * A new node is allocated, and a single item is inserted to
1242 * point to the existing root
Chris Masonaa5d6be2007-02-28 16:35:06 -05001243 *
1244 * returns zero on success or < 0 on failure.
Chris Mason97571fd2007-02-24 13:39:08 -05001245 */
Chris Mason5f39d392007-10-15 16:14:19 -04001246static int insert_new_root(struct btrfs_trans_handle *trans,
1247 struct btrfs_root *root,
1248 struct btrfs_path *path, int level)
Chris Mason5c680ed2007-02-22 11:39:13 -05001249{
Chris Mason7bb86312007-12-11 09:25:06 -05001250 u64 root_gen;
1251 u64 lower_gen;
Chris Mason5f39d392007-10-15 16:14:19 -04001252 struct extent_buffer *lower;
1253 struct extent_buffer *c;
1254 struct btrfs_disk_key lower_key;
Chris Mason5c680ed2007-02-22 11:39:13 -05001255
1256 BUG_ON(path->nodes[level]);
1257 BUG_ON(path->nodes[level-1] != root->node);
1258
Chris Mason7bb86312007-12-11 09:25:06 -05001259 if (root->ref_cows)
1260 root_gen = trans->transid;
1261 else
1262 root_gen = 0;
1263
1264 lower = path->nodes[level-1];
1265 if (level == 1)
1266 btrfs_item_key(lower, &lower_key, 0);
1267 else
1268 btrfs_node_key(lower, &lower_key, 0);
1269
1270 c = __btrfs_alloc_free_block(trans, root, root->nodesize,
1271 root->root_key.objectid,
1272 root_gen, lower_key.objectid, level,
Chris Masondb945352007-10-15 16:15:53 -04001273 root->node->start, 0);
Chris Mason5f39d392007-10-15 16:14:19 -04001274 if (IS_ERR(c))
1275 return PTR_ERR(c);
1276 memset_extent_buffer(c, 0, 0, root->nodesize);
1277 btrfs_set_header_nritems(c, 1);
1278 btrfs_set_header_level(c, level);
Chris Masondb945352007-10-15 16:15:53 -04001279 btrfs_set_header_bytenr(c, c->start);
Chris Mason5f39d392007-10-15 16:14:19 -04001280 btrfs_set_header_generation(c, trans->transid);
1281 btrfs_set_header_owner(c, root->root_key.objectid);
Chris Masond5719762007-03-23 10:01:08 -04001282
Chris Mason5f39d392007-10-15 16:14:19 -04001283 write_extent_buffer(c, root->fs_info->fsid,
1284 (unsigned long)btrfs_header_fsid(c),
1285 BTRFS_FSID_SIZE);
Chris Mason5f39d392007-10-15 16:14:19 -04001286 btrfs_set_node_key(c, &lower_key, 0);
Chris Masondb945352007-10-15 16:15:53 -04001287 btrfs_set_node_blockptr(c, 0, lower->start);
Chris Mason7bb86312007-12-11 09:25:06 -05001288 lower_gen = btrfs_header_generation(lower);
1289 WARN_ON(lower_gen == 0);
1290
1291 btrfs_set_node_ptr_generation(c, 0, lower_gen);
Chris Mason5f39d392007-10-15 16:14:19 -04001292
1293 btrfs_mark_buffer_dirty(c);
Chris Masond5719762007-03-23 10:01:08 -04001294
Chris Mason5c680ed2007-02-22 11:39:13 -05001295 /* the super has an extra ref to root->node */
Chris Mason5f39d392007-10-15 16:14:19 -04001296 free_extent_buffer(root->node);
1297 root->node = c;
1298 extent_buffer_get(c);
1299 path->nodes[level] = c;
Chris Mason5c680ed2007-02-22 11:39:13 -05001300 path->slots[level] = 0;
Chris Mason7bb86312007-12-11 09:25:06 -05001301
1302 if (root->ref_cows && lower_gen != trans->transid) {
1303 struct btrfs_path *back_path = btrfs_alloc_path();
1304 int ret;
1305 ret = btrfs_insert_extent_backref(trans,
1306 root->fs_info->extent_root,
1307 path, lower->start,
1308 root->root_key.objectid,
1309 trans->transid, 0, 0);
1310 BUG_ON(ret);
1311 btrfs_free_path(back_path);
1312 }
Chris Mason5c680ed2007-02-22 11:39:13 -05001313 return 0;
1314}
1315
Chris Mason74123bd2007-02-02 11:05:29 -05001316/*
1317 * worker function to insert a single pointer in a node.
1318 * the node should have enough room for the pointer already
Chris Mason97571fd2007-02-24 13:39:08 -05001319 *
Chris Mason74123bd2007-02-02 11:05:29 -05001320 * slot and level indicate where you want the key to go, and
1321 * blocknr is the block the key points to.
Chris Masonaa5d6be2007-02-28 16:35:06 -05001322 *
1323 * returns zero on success and < 0 on any error
Chris Mason74123bd2007-02-02 11:05:29 -05001324 */
Chris Masone089f052007-03-16 16:20:31 -04001325static int insert_ptr(struct btrfs_trans_handle *trans, struct btrfs_root
1326 *root, struct btrfs_path *path, struct btrfs_disk_key
Chris Masondb945352007-10-15 16:15:53 -04001327 *key, u64 bytenr, int slot, int level)
Chris Mason74123bd2007-02-02 11:05:29 -05001328{
Chris Mason5f39d392007-10-15 16:14:19 -04001329 struct extent_buffer *lower;
Chris Mason74123bd2007-02-02 11:05:29 -05001330 int nritems;
Chris Mason5c680ed2007-02-22 11:39:13 -05001331
1332 BUG_ON(!path->nodes[level]);
Chris Mason5f39d392007-10-15 16:14:19 -04001333 lower = path->nodes[level];
1334 nritems = btrfs_header_nritems(lower);
Chris Mason74123bd2007-02-02 11:05:29 -05001335 if (slot > nritems)
1336 BUG();
Chris Mason123abc82007-03-14 14:14:43 -04001337 if (nritems == BTRFS_NODEPTRS_PER_BLOCK(root))
Chris Mason74123bd2007-02-02 11:05:29 -05001338 BUG();
1339 if (slot != nritems) {
Chris Mason5f39d392007-10-15 16:14:19 -04001340 memmove_extent_buffer(lower,
1341 btrfs_node_key_ptr_offset(slot + 1),
1342 btrfs_node_key_ptr_offset(slot),
Chris Masond6025572007-03-30 14:27:56 -04001343 (nritems - slot) * sizeof(struct btrfs_key_ptr));
Chris Mason74123bd2007-02-02 11:05:29 -05001344 }
Chris Mason5f39d392007-10-15 16:14:19 -04001345 btrfs_set_node_key(lower, key, slot);
Chris Masondb945352007-10-15 16:15:53 -04001346 btrfs_set_node_blockptr(lower, slot, bytenr);
Chris Mason74493f72007-12-11 09:25:06 -05001347 WARN_ON(trans->transid == 0);
1348 btrfs_set_node_ptr_generation(lower, slot, trans->transid);
Chris Mason5f39d392007-10-15 16:14:19 -04001349 btrfs_set_header_nritems(lower, nritems + 1);
1350 btrfs_mark_buffer_dirty(lower);
Chris Mason74123bd2007-02-02 11:05:29 -05001351 return 0;
1352}
1353
Chris Mason97571fd2007-02-24 13:39:08 -05001354/*
1355 * split the node at the specified level in path in two.
1356 * The path is corrected to point to the appropriate node after the split
1357 *
1358 * Before splitting this tries to make some room in the node by pushing
1359 * left and right, if either one works, it returns right away.
Chris Masonaa5d6be2007-02-28 16:35:06 -05001360 *
1361 * returns 0 on success and < 0 on failure
Chris Mason97571fd2007-02-24 13:39:08 -05001362 */
Chris Masone089f052007-03-16 16:20:31 -04001363static int split_node(struct btrfs_trans_handle *trans, struct btrfs_root
1364 *root, struct btrfs_path *path, int level)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001365{
Chris Mason7bb86312007-12-11 09:25:06 -05001366 u64 root_gen;
Chris Mason5f39d392007-10-15 16:14:19 -04001367 struct extent_buffer *c;
1368 struct extent_buffer *split;
1369 struct btrfs_disk_key disk_key;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001370 int mid;
Chris Mason5c680ed2007-02-22 11:39:13 -05001371 int ret;
Chris Masonaa5d6be2007-02-28 16:35:06 -05001372 int wret;
Chris Mason7518a232007-03-12 12:01:18 -04001373 u32 c_nritems;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001374
Chris Mason5f39d392007-10-15 16:14:19 -04001375 c = path->nodes[level];
Chris Mason7bb86312007-12-11 09:25:06 -05001376 WARN_ON(btrfs_header_generation(c) != trans->transid);
Chris Mason5f39d392007-10-15 16:14:19 -04001377 if (c == root->node) {
Chris Mason5c680ed2007-02-22 11:39:13 -05001378 /* trying to split the root, lets make a new one */
Chris Masone089f052007-03-16 16:20:31 -04001379 ret = insert_new_root(trans, root, path, level + 1);
Chris Mason5c680ed2007-02-22 11:39:13 -05001380 if (ret)
1381 return ret;
Chris Masone66f7092007-04-20 13:16:02 -04001382 } else {
1383 ret = push_nodes_for_insert(trans, root, path, level);
Chris Mason5f39d392007-10-15 16:14:19 -04001384 c = path->nodes[level];
1385 if (!ret && btrfs_header_nritems(c) <
Chris Masone66f7092007-04-20 13:16:02 -04001386 BTRFS_NODEPTRS_PER_BLOCK(root) - 1)
1387 return 0;
Chris Mason54aa1f42007-06-22 14:16:25 -04001388 if (ret < 0)
1389 return ret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001390 }
Chris Masone66f7092007-04-20 13:16:02 -04001391
Chris Mason5f39d392007-10-15 16:14:19 -04001392 c_nritems = btrfs_header_nritems(c);
Chris Mason7bb86312007-12-11 09:25:06 -05001393 if (root->ref_cows)
1394 root_gen = trans->transid;
1395 else
1396 root_gen = 0;
1397
1398 btrfs_node_key(c, &disk_key, 0);
1399 split = __btrfs_alloc_free_block(trans, root, root->nodesize,
1400 root->root_key.objectid,
1401 root_gen,
1402 btrfs_disk_key_objectid(&disk_key),
1403 level, c->start, 0);
Chris Mason5f39d392007-10-15 16:14:19 -04001404 if (IS_ERR(split))
1405 return PTR_ERR(split);
Chris Mason54aa1f42007-06-22 14:16:25 -04001406
Chris Mason5f39d392007-10-15 16:14:19 -04001407 btrfs_set_header_flags(split, btrfs_header_flags(c));
1408 btrfs_set_header_level(split, btrfs_header_level(c));
Chris Masondb945352007-10-15 16:15:53 -04001409 btrfs_set_header_bytenr(split, split->start);
Chris Mason5f39d392007-10-15 16:14:19 -04001410 btrfs_set_header_generation(split, trans->transid);
1411 btrfs_set_header_owner(split, root->root_key.objectid);
1412 write_extent_buffer(split, root->fs_info->fsid,
1413 (unsigned long)btrfs_header_fsid(split),
1414 BTRFS_FSID_SIZE);
1415
Chris Mason7518a232007-03-12 12:01:18 -04001416 mid = (c_nritems + 1) / 2;
Chris Mason5f39d392007-10-15 16:14:19 -04001417
1418 copy_extent_buffer(split, c,
1419 btrfs_node_key_ptr_offset(0),
1420 btrfs_node_key_ptr_offset(mid),
1421 (c_nritems - mid) * sizeof(struct btrfs_key_ptr));
1422 btrfs_set_header_nritems(split, c_nritems - mid);
1423 btrfs_set_header_nritems(c, mid);
Chris Masonaa5d6be2007-02-28 16:35:06 -05001424 ret = 0;
1425
Chris Mason5f39d392007-10-15 16:14:19 -04001426 btrfs_mark_buffer_dirty(c);
1427 btrfs_mark_buffer_dirty(split);
1428
1429 btrfs_node_key(split, &disk_key, 0);
Chris Masondb945352007-10-15 16:15:53 -04001430 wret = insert_ptr(trans, root, path, &disk_key, split->start,
Chris Mason5f39d392007-10-15 16:14:19 -04001431 path->slots[level + 1] + 1,
Chris Mason123abc82007-03-14 14:14:43 -04001432 level + 1);
Chris Masonaa5d6be2007-02-28 16:35:06 -05001433 if (wret)
1434 ret = wret;
1435
Chris Mason5de08d72007-02-24 06:24:44 -05001436 if (path->slots[level] >= mid) {
Chris Mason5c680ed2007-02-22 11:39:13 -05001437 path->slots[level] -= mid;
Chris Mason5f39d392007-10-15 16:14:19 -04001438 free_extent_buffer(c);
1439 path->nodes[level] = split;
Chris Mason5c680ed2007-02-22 11:39:13 -05001440 path->slots[level + 1] += 1;
1441 } else {
Chris Mason5f39d392007-10-15 16:14:19 -04001442 free_extent_buffer(split);
Chris Masonbe0e5c02007-01-26 15:51:26 -05001443 }
Chris Masonaa5d6be2007-02-28 16:35:06 -05001444 return ret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001445}
1446
Chris Mason74123bd2007-02-02 11:05:29 -05001447/*
1448 * how many bytes are required to store the items in a leaf. start
1449 * and nr indicate which items in the leaf to check. This totals up the
1450 * space used both by the item structs and the item data
1451 */
Chris Mason5f39d392007-10-15 16:14:19 -04001452static int leaf_space_used(struct extent_buffer *l, int start, int nr)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001453{
1454 int data_len;
Chris Mason5f39d392007-10-15 16:14:19 -04001455 int nritems = btrfs_header_nritems(l);
Chris Masond4dbff92007-04-04 14:08:15 -04001456 int end = min(nritems, start + nr) - 1;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001457
1458 if (!nr)
1459 return 0;
Chris Mason5f39d392007-10-15 16:14:19 -04001460 data_len = btrfs_item_end_nr(l, start);
1461 data_len = data_len - btrfs_item_offset_nr(l, end);
Chris Mason0783fcf2007-03-12 20:12:07 -04001462 data_len += sizeof(struct btrfs_item) * nr;
Chris Masond4dbff92007-04-04 14:08:15 -04001463 WARN_ON(data_len < 0);
Chris Masonbe0e5c02007-01-26 15:51:26 -05001464 return data_len;
1465}
1466
/*
 * how much room the leaf has left for new items and their data: the leaf
 * data size minus the space used by every item currently in the leaf.
 *
 * a negative result is logged and still handed back to the caller.
 */
int btrfs_leaf_free_space(struct btrfs_root *root, struct extent_buffer *leaf)
{
	int nritems = btrfs_header_nritems(leaf);
	int ret;

	ret = BTRFS_LEAF_DATA_SIZE(root) - leaf_space_used(leaf, 0, nritems);
	if (ret >= 0)
		return ret;

	printk("leaf free space ret %d, leaf data size %lu, used %d nritems %d\n",
	       ret, (unsigned long) BTRFS_LEAF_DATA_SIZE(root),
	       leaf_space_used(leaf, 0, nritems), nritems);
	return ret;
}
1484
1485/*
Chris Mason00ec4c52007-02-24 12:47:20 -05001486 * push some data in the path leaf to the right, trying to free up at
1487 * least data_size bytes. returns zero if the push worked, nonzero otherwise
Chris Masonaa5d6be2007-02-28 16:35:06 -05001488 *
1489 * returns 1 if the push failed because the other node didn't have enough
1490 * room, 0 if everything worked out and < 0 if there were major errors.
Chris Mason00ec4c52007-02-24 12:47:20 -05001491 */
Chris Masone089f052007-03-16 16:20:31 -04001492static int push_leaf_right(struct btrfs_trans_handle *trans, struct btrfs_root
Chris Mason34a38212007-11-07 13:31:03 -05001493 *root, struct btrfs_path *path, int data_size,
1494 int empty)
Chris Mason00ec4c52007-02-24 12:47:20 -05001495{
Chris Mason5f39d392007-10-15 16:14:19 -04001496 struct extent_buffer *left = path->nodes[0];
1497 struct extent_buffer *right;
1498 struct extent_buffer *upper;
1499 struct btrfs_disk_key disk_key;
Chris Mason00ec4c52007-02-24 12:47:20 -05001500 int slot;
Chris Mason34a38212007-11-07 13:31:03 -05001501 u32 i;
Chris Mason00ec4c52007-02-24 12:47:20 -05001502 int free_space;
1503 int push_space = 0;
1504 int push_items = 0;
Chris Mason0783fcf2007-03-12 20:12:07 -04001505 struct btrfs_item *item;
Chris Mason7518a232007-03-12 12:01:18 -04001506 u32 left_nritems;
Chris Mason34a38212007-11-07 13:31:03 -05001507 u32 nr;
Chris Mason7518a232007-03-12 12:01:18 -04001508 u32 right_nritems;
Chris Mason5f39d392007-10-15 16:14:19 -04001509 u32 data_end;
Chris Masondb945352007-10-15 16:15:53 -04001510 u32 this_item_size;
Chris Mason54aa1f42007-06-22 14:16:25 -04001511 int ret;
Chris Mason00ec4c52007-02-24 12:47:20 -05001512
1513 slot = path->slots[1];
1514 if (!path->nodes[1]) {
1515 return 1;
1516 }
1517 upper = path->nodes[1];
Chris Mason5f39d392007-10-15 16:14:19 -04001518 if (slot >= btrfs_header_nritems(upper) - 1)
Chris Mason00ec4c52007-02-24 12:47:20 -05001519 return 1;
Chris Mason5f39d392007-10-15 16:14:19 -04001520
Chris Masondb945352007-10-15 16:15:53 -04001521 right = read_tree_block(root, btrfs_node_blockptr(upper, slot + 1),
1522 root->leafsize);
Chris Mason123abc82007-03-14 14:14:43 -04001523 free_space = btrfs_leaf_free_space(root, right);
Chris Mason0783fcf2007-03-12 20:12:07 -04001524 if (free_space < data_size + sizeof(struct btrfs_item)) {
Chris Mason5f39d392007-10-15 16:14:19 -04001525 free_extent_buffer(right);
Chris Mason02217ed2007-03-02 16:08:05 -05001526 return 1;
1527 }
1528
Chris Mason5f39d392007-10-15 16:14:19 -04001529 /* cow and double check */
1530 ret = btrfs_cow_block(trans, root, right, upper,
1531 slot + 1, &right);
1532 if (ret) {
1533 free_extent_buffer(right);
Chris Masona429e512007-04-18 16:15:28 -04001534 return 1;
1535 }
Chris Mason5f39d392007-10-15 16:14:19 -04001536 free_space = btrfs_leaf_free_space(root, right);
1537 if (free_space < data_size + sizeof(struct btrfs_item)) {
1538 free_extent_buffer(right);
1539 return 1;
1540 }
1541
1542 left_nritems = btrfs_header_nritems(left);
1543 if (left_nritems == 0) {
1544 free_extent_buffer(right);
1545 return 1;
1546 }
1547
Chris Mason34a38212007-11-07 13:31:03 -05001548 if (empty)
1549 nr = 0;
1550 else
1551 nr = 1;
1552
1553 i = left_nritems - 1;
1554 while (i >= nr) {
Chris Mason5f39d392007-10-15 16:14:19 -04001555 item = btrfs_item_nr(left, i);
Chris Masondb945352007-10-15 16:15:53 -04001556
Chris Mason00ec4c52007-02-24 12:47:20 -05001557 if (path->slots[0] == i)
1558 push_space += data_size + sizeof(*item);
Chris Masondb945352007-10-15 16:15:53 -04001559
1560 if (!left->map_token) {
1561 map_extent_buffer(left, (unsigned long)item,
1562 sizeof(struct btrfs_item),
1563 &left->map_token, &left->kaddr,
1564 &left->map_start, &left->map_len,
1565 KM_USER1);
1566 }
1567
1568 this_item_size = btrfs_item_size(left, item);
1569 if (this_item_size + sizeof(*item) + push_space > free_space)
Chris Mason00ec4c52007-02-24 12:47:20 -05001570 break;
1571 push_items++;
Chris Masondb945352007-10-15 16:15:53 -04001572 push_space += this_item_size + sizeof(*item);
Chris Mason34a38212007-11-07 13:31:03 -05001573 if (i == 0)
1574 break;
1575 i--;
Chris Masondb945352007-10-15 16:15:53 -04001576 }
1577 if (left->map_token) {
1578 unmap_extent_buffer(left, left->map_token, KM_USER1);
1579 left->map_token = NULL;
Chris Mason00ec4c52007-02-24 12:47:20 -05001580 }
Chris Mason5f39d392007-10-15 16:14:19 -04001581
Chris Mason00ec4c52007-02-24 12:47:20 -05001582 if (push_items == 0) {
Chris Mason5f39d392007-10-15 16:14:19 -04001583 free_extent_buffer(right);
Chris Mason00ec4c52007-02-24 12:47:20 -05001584 return 1;
1585 }
Chris Mason5f39d392007-10-15 16:14:19 -04001586
Chris Mason34a38212007-11-07 13:31:03 -05001587 if (!empty && push_items == left_nritems)
Chris Masona429e512007-04-18 16:15:28 -04001588 WARN_ON(1);
Chris Mason5f39d392007-10-15 16:14:19 -04001589
Chris Mason00ec4c52007-02-24 12:47:20 -05001590 /* push left to right */
Chris Mason5f39d392007-10-15 16:14:19 -04001591 right_nritems = btrfs_header_nritems(right);
Chris Mason34a38212007-11-07 13:31:03 -05001592
Chris Mason5f39d392007-10-15 16:14:19 -04001593 push_space = btrfs_item_end_nr(left, left_nritems - push_items);
Chris Mason123abc82007-03-14 14:14:43 -04001594 push_space -= leaf_data_end(root, left);
Chris Mason5f39d392007-10-15 16:14:19 -04001595
Chris Mason00ec4c52007-02-24 12:47:20 -05001596 /* make room in the right data area */
Chris Mason5f39d392007-10-15 16:14:19 -04001597 data_end = leaf_data_end(root, right);
1598 memmove_extent_buffer(right,
1599 btrfs_leaf_data(right) + data_end - push_space,
1600 btrfs_leaf_data(right) + data_end,
1601 BTRFS_LEAF_DATA_SIZE(root) - data_end);
1602
Chris Mason00ec4c52007-02-24 12:47:20 -05001603 /* copy from the left data area */
Chris Mason5f39d392007-10-15 16:14:19 -04001604 copy_extent_buffer(right, left, btrfs_leaf_data(right) +
Chris Masond6025572007-03-30 14:27:56 -04001605 BTRFS_LEAF_DATA_SIZE(root) - push_space,
1606 btrfs_leaf_data(left) + leaf_data_end(root, left),
1607 push_space);
Chris Mason5f39d392007-10-15 16:14:19 -04001608
1609 memmove_extent_buffer(right, btrfs_item_nr_offset(push_items),
1610 btrfs_item_nr_offset(0),
1611 right_nritems * sizeof(struct btrfs_item));
1612
Chris Mason00ec4c52007-02-24 12:47:20 -05001613 /* copy the items from left to right */
Chris Mason5f39d392007-10-15 16:14:19 -04001614 copy_extent_buffer(right, left, btrfs_item_nr_offset(0),
1615 btrfs_item_nr_offset(left_nritems - push_items),
1616 push_items * sizeof(struct btrfs_item));
Chris Mason00ec4c52007-02-24 12:47:20 -05001617
1618 /* update the item pointers */
Chris Mason7518a232007-03-12 12:01:18 -04001619 right_nritems += push_items;
Chris Mason5f39d392007-10-15 16:14:19 -04001620 btrfs_set_header_nritems(right, right_nritems);
Chris Mason123abc82007-03-14 14:14:43 -04001621 push_space = BTRFS_LEAF_DATA_SIZE(root);
Chris Mason7518a232007-03-12 12:01:18 -04001622 for (i = 0; i < right_nritems; i++) {
Chris Mason5f39d392007-10-15 16:14:19 -04001623 item = btrfs_item_nr(right, i);
Chris Masondb945352007-10-15 16:15:53 -04001624 if (!right->map_token) {
1625 map_extent_buffer(right, (unsigned long)item,
1626 sizeof(struct btrfs_item),
1627 &right->map_token, &right->kaddr,
1628 &right->map_start, &right->map_len,
1629 KM_USER1);
1630 }
1631 push_space -= btrfs_item_size(right, item);
1632 btrfs_set_item_offset(right, item, push_space);
1633 }
1634
1635 if (right->map_token) {
1636 unmap_extent_buffer(right, right->map_token, KM_USER1);
1637 right->map_token = NULL;
Chris Mason00ec4c52007-02-24 12:47:20 -05001638 }
Chris Mason7518a232007-03-12 12:01:18 -04001639 left_nritems -= push_items;
Chris Mason5f39d392007-10-15 16:14:19 -04001640 btrfs_set_header_nritems(left, left_nritems);
Chris Mason00ec4c52007-02-24 12:47:20 -05001641
Chris Mason34a38212007-11-07 13:31:03 -05001642 if (left_nritems)
1643 btrfs_mark_buffer_dirty(left);
Chris Mason5f39d392007-10-15 16:14:19 -04001644 btrfs_mark_buffer_dirty(right);
Chris Masona429e512007-04-18 16:15:28 -04001645
Chris Mason5f39d392007-10-15 16:14:19 -04001646 btrfs_item_key(right, &disk_key, 0);
1647 btrfs_set_node_key(upper, &disk_key, slot + 1);
Chris Masond6025572007-03-30 14:27:56 -04001648 btrfs_mark_buffer_dirty(upper);
Chris Mason02217ed2007-03-02 16:08:05 -05001649
Chris Mason00ec4c52007-02-24 12:47:20 -05001650 /* then fixup the leaf pointer in the path */
Chris Mason7518a232007-03-12 12:01:18 -04001651 if (path->slots[0] >= left_nritems) {
1652 path->slots[0] -= left_nritems;
Chris Mason5f39d392007-10-15 16:14:19 -04001653 free_extent_buffer(path->nodes[0]);
1654 path->nodes[0] = right;
Chris Mason00ec4c52007-02-24 12:47:20 -05001655 path->slots[1] += 1;
1656 } else {
Chris Mason5f39d392007-10-15 16:14:19 -04001657 free_extent_buffer(right);
Chris Mason00ec4c52007-02-24 12:47:20 -05001658 }
1659 return 0;
1660}
1661/*
Chris Mason74123bd2007-02-02 11:05:29 -05001662 * push some data in the path leaf to the left, trying to free up at
1663 * least data_size bytes. returns zero if the push worked, nonzero otherwise
1664 */
Chris Masone089f052007-03-16 16:20:31 -04001665static int push_leaf_left(struct btrfs_trans_handle *trans, struct btrfs_root
Chris Mason34a38212007-11-07 13:31:03 -05001666 *root, struct btrfs_path *path, int data_size,
1667 int empty)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001668{
Chris Mason5f39d392007-10-15 16:14:19 -04001669 struct btrfs_disk_key disk_key;
1670 struct extent_buffer *right = path->nodes[0];
1671 struct extent_buffer *left;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001672 int slot;
1673 int i;
1674 int free_space;
1675 int push_space = 0;
1676 int push_items = 0;
Chris Mason0783fcf2007-03-12 20:12:07 -04001677 struct btrfs_item *item;
Chris Mason7518a232007-03-12 12:01:18 -04001678 u32 old_left_nritems;
Chris Mason5f39d392007-10-15 16:14:19 -04001679 u32 right_nritems;
Chris Mason34a38212007-11-07 13:31:03 -05001680 u32 nr;
Chris Masonaa5d6be2007-02-28 16:35:06 -05001681 int ret = 0;
1682 int wret;
Chris Masondb945352007-10-15 16:15:53 -04001683 u32 this_item_size;
1684 u32 old_left_item_size;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001685
1686 slot = path->slots[1];
Chris Mason5f39d392007-10-15 16:14:19 -04001687 if (slot == 0)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001688 return 1;
Chris Mason5f39d392007-10-15 16:14:19 -04001689 if (!path->nodes[1])
Chris Masonbe0e5c02007-01-26 15:51:26 -05001690 return 1;
Chris Mason5f39d392007-10-15 16:14:19 -04001691
Chris Mason3685f792007-10-19 09:23:27 -04001692 right_nritems = btrfs_header_nritems(right);
1693 if (right_nritems == 0) {
1694 return 1;
1695 }
1696
Chris Mason5f39d392007-10-15 16:14:19 -04001697 left = read_tree_block(root, btrfs_node_blockptr(path->nodes[1],
Chris Masondb945352007-10-15 16:15:53 -04001698 slot - 1), root->leafsize);
Chris Mason123abc82007-03-14 14:14:43 -04001699 free_space = btrfs_leaf_free_space(root, left);
Chris Mason0783fcf2007-03-12 20:12:07 -04001700 if (free_space < data_size + sizeof(struct btrfs_item)) {
Chris Mason5f39d392007-10-15 16:14:19 -04001701 free_extent_buffer(left);
Chris Masonbe0e5c02007-01-26 15:51:26 -05001702 return 1;
1703 }
Chris Mason02217ed2007-03-02 16:08:05 -05001704
1705 /* cow and double check */
Chris Mason5f39d392007-10-15 16:14:19 -04001706 ret = btrfs_cow_block(trans, root, left,
1707 path->nodes[1], slot - 1, &left);
Chris Mason54aa1f42007-06-22 14:16:25 -04001708 if (ret) {
1709 /* we hit -ENOSPC, but it isn't fatal here */
Chris Mason5f39d392007-10-15 16:14:19 -04001710 free_extent_buffer(left);
Chris Mason54aa1f42007-06-22 14:16:25 -04001711 return 1;
1712 }
Chris Mason3685f792007-10-19 09:23:27 -04001713
Chris Mason123abc82007-03-14 14:14:43 -04001714 free_space = btrfs_leaf_free_space(root, left);
Chris Mason0783fcf2007-03-12 20:12:07 -04001715 if (free_space < data_size + sizeof(struct btrfs_item)) {
Chris Mason5f39d392007-10-15 16:14:19 -04001716 free_extent_buffer(left);
Chris Mason02217ed2007-03-02 16:08:05 -05001717 return 1;
1718 }
1719
Chris Mason34a38212007-11-07 13:31:03 -05001720 if (empty)
1721 nr = right_nritems;
1722 else
1723 nr = right_nritems - 1;
1724
1725 for (i = 0; i < nr; i++) {
Chris Mason5f39d392007-10-15 16:14:19 -04001726 item = btrfs_item_nr(right, i);
Chris Masondb945352007-10-15 16:15:53 -04001727 if (!right->map_token) {
1728 map_extent_buffer(right, (unsigned long)item,
1729 sizeof(struct btrfs_item),
1730 &right->map_token, &right->kaddr,
1731 &right->map_start, &right->map_len,
1732 KM_USER1);
1733 }
1734
Chris Masonbe0e5c02007-01-26 15:51:26 -05001735 if (path->slots[0] == i)
1736 push_space += data_size + sizeof(*item);
Chris Masondb945352007-10-15 16:15:53 -04001737
1738 this_item_size = btrfs_item_size(right, item);
1739 if (this_item_size + sizeof(*item) + push_space > free_space)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001740 break;
Chris Masondb945352007-10-15 16:15:53 -04001741
Chris Masonbe0e5c02007-01-26 15:51:26 -05001742 push_items++;
Chris Masondb945352007-10-15 16:15:53 -04001743 push_space += this_item_size + sizeof(*item);
Chris Masonbe0e5c02007-01-26 15:51:26 -05001744 }
Chris Masondb945352007-10-15 16:15:53 -04001745
1746 if (right->map_token) {
1747 unmap_extent_buffer(right, right->map_token, KM_USER1);
1748 right->map_token = NULL;
1749 }
1750
Chris Masonbe0e5c02007-01-26 15:51:26 -05001751 if (push_items == 0) {
Chris Mason5f39d392007-10-15 16:14:19 -04001752 free_extent_buffer(left);
Chris Masonbe0e5c02007-01-26 15:51:26 -05001753 return 1;
1754 }
Chris Mason34a38212007-11-07 13:31:03 -05001755 if (!empty && push_items == btrfs_header_nritems(right))
Chris Masona429e512007-04-18 16:15:28 -04001756 WARN_ON(1);
Chris Mason5f39d392007-10-15 16:14:19 -04001757
Chris Masonbe0e5c02007-01-26 15:51:26 -05001758 /* push data from right to left */
Chris Mason5f39d392007-10-15 16:14:19 -04001759 copy_extent_buffer(left, right,
1760 btrfs_item_nr_offset(btrfs_header_nritems(left)),
1761 btrfs_item_nr_offset(0),
1762 push_items * sizeof(struct btrfs_item));
1763
Chris Mason123abc82007-03-14 14:14:43 -04001764 push_space = BTRFS_LEAF_DATA_SIZE(root) -
Chris Mason5f39d392007-10-15 16:14:19 -04001765 btrfs_item_offset_nr(right, push_items -1);
1766
1767 copy_extent_buffer(left, right, btrfs_leaf_data(left) +
Chris Masond6025572007-03-30 14:27:56 -04001768 leaf_data_end(root, left) - push_space,
1769 btrfs_leaf_data(right) +
Chris Mason5f39d392007-10-15 16:14:19 -04001770 btrfs_item_offset_nr(right, push_items - 1),
Chris Masond6025572007-03-30 14:27:56 -04001771 push_space);
Chris Mason5f39d392007-10-15 16:14:19 -04001772 old_left_nritems = btrfs_header_nritems(left);
Chris Masoneb60cea2007-02-02 09:18:22 -05001773 BUG_ON(old_left_nritems < 0);
1774
Chris Masondb945352007-10-15 16:15:53 -04001775 old_left_item_size = btrfs_item_offset_nr(left, old_left_nritems - 1);
Chris Mason0783fcf2007-03-12 20:12:07 -04001776 for (i = old_left_nritems; i < old_left_nritems + push_items; i++) {
Chris Mason5f39d392007-10-15 16:14:19 -04001777 u32 ioff;
Chris Masondb945352007-10-15 16:15:53 -04001778
Chris Mason5f39d392007-10-15 16:14:19 -04001779 item = btrfs_item_nr(left, i);
Chris Masondb945352007-10-15 16:15:53 -04001780 if (!left->map_token) {
1781 map_extent_buffer(left, (unsigned long)item,
1782 sizeof(struct btrfs_item),
1783 &left->map_token, &left->kaddr,
1784 &left->map_start, &left->map_len,
1785 KM_USER1);
1786 }
1787
Chris Mason5f39d392007-10-15 16:14:19 -04001788 ioff = btrfs_item_offset(left, item);
1789 btrfs_set_item_offset(left, item,
Chris Masondb945352007-10-15 16:15:53 -04001790 ioff - (BTRFS_LEAF_DATA_SIZE(root) - old_left_item_size));
Chris Masonbe0e5c02007-01-26 15:51:26 -05001791 }
Chris Mason5f39d392007-10-15 16:14:19 -04001792 btrfs_set_header_nritems(left, old_left_nritems + push_items);
Chris Masondb945352007-10-15 16:15:53 -04001793 if (left->map_token) {
1794 unmap_extent_buffer(left, left->map_token, KM_USER1);
1795 left->map_token = NULL;
1796 }
Chris Masonbe0e5c02007-01-26 15:51:26 -05001797
1798 /* fixup right node */
Chris Mason34a38212007-11-07 13:31:03 -05001799 if (push_items > right_nritems) {
1800 printk("push items %d nr %u\n", push_items, right_nritems);
1801 WARN_ON(1);
1802 }
Chris Mason5f39d392007-10-15 16:14:19 -04001803
Chris Mason34a38212007-11-07 13:31:03 -05001804 if (push_items < right_nritems) {
1805 push_space = btrfs_item_offset_nr(right, push_items - 1) -
1806 leaf_data_end(root, right);
1807 memmove_extent_buffer(right, btrfs_leaf_data(right) +
1808 BTRFS_LEAF_DATA_SIZE(root) - push_space,
1809 btrfs_leaf_data(right) +
1810 leaf_data_end(root, right), push_space);
1811
1812 memmove_extent_buffer(right, btrfs_item_nr_offset(0),
Chris Mason5f39d392007-10-15 16:14:19 -04001813 btrfs_item_nr_offset(push_items),
1814 (btrfs_header_nritems(right) - push_items) *
1815 sizeof(struct btrfs_item));
Chris Mason34a38212007-11-07 13:31:03 -05001816 }
Yaneef1c492007-11-26 10:58:13 -05001817 right_nritems -= push_items;
1818 btrfs_set_header_nritems(right, right_nritems);
Chris Mason123abc82007-03-14 14:14:43 -04001819 push_space = BTRFS_LEAF_DATA_SIZE(root);
Chris Mason5f39d392007-10-15 16:14:19 -04001820 for (i = 0; i < right_nritems; i++) {
1821 item = btrfs_item_nr(right, i);
Chris Masondb945352007-10-15 16:15:53 -04001822
1823 if (!right->map_token) {
1824 map_extent_buffer(right, (unsigned long)item,
1825 sizeof(struct btrfs_item),
1826 &right->map_token, &right->kaddr,
1827 &right->map_start, &right->map_len,
1828 KM_USER1);
1829 }
1830
1831 push_space = push_space - btrfs_item_size(right, item);
1832 btrfs_set_item_offset(right, item, push_space);
1833 }
1834 if (right->map_token) {
1835 unmap_extent_buffer(right, right->map_token, KM_USER1);
1836 right->map_token = NULL;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001837 }
Chris Masoneb60cea2007-02-02 09:18:22 -05001838
Chris Mason5f39d392007-10-15 16:14:19 -04001839 btrfs_mark_buffer_dirty(left);
Chris Mason34a38212007-11-07 13:31:03 -05001840 if (right_nritems)
1841 btrfs_mark_buffer_dirty(right);
Chris Mason098f59c2007-05-11 11:33:21 -04001842
Chris Mason5f39d392007-10-15 16:14:19 -04001843 btrfs_item_key(right, &disk_key, 0);
1844 wret = fixup_low_keys(trans, root, path, &disk_key, 1);
Chris Masonaa5d6be2007-02-28 16:35:06 -05001845 if (wret)
1846 ret = wret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001847
1848 /* then fixup the leaf pointer in the path */
1849 if (path->slots[0] < push_items) {
1850 path->slots[0] += old_left_nritems;
Chris Mason5f39d392007-10-15 16:14:19 -04001851 free_extent_buffer(path->nodes[0]);
1852 path->nodes[0] = left;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001853 path->slots[1] -= 1;
1854 } else {
Chris Mason5f39d392007-10-15 16:14:19 -04001855 free_extent_buffer(left);
Chris Masonbe0e5c02007-01-26 15:51:26 -05001856 path->slots[0] -= push_items;
1857 }
Chris Masoneb60cea2007-02-02 09:18:22 -05001858 BUG_ON(path->slots[0] < 0);
Chris Masonaa5d6be2007-02-28 16:35:06 -05001859 return ret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001860}
1861
Chris Mason74123bd2007-02-02 11:05:29 -05001862/*
1863 * split the path's leaf in two, making sure there is at least data_size
1864 * available for the resulting leaf level of the path.
Chris Masonaa5d6be2007-02-28 16:35:06 -05001865 *
1866 * returns 0 if all went well and < 0 on failure.
Chris Mason74123bd2007-02-02 11:05:29 -05001867 */
Chris Masone089f052007-03-16 16:20:31 -04001868static int split_leaf(struct btrfs_trans_handle *trans, struct btrfs_root
Chris Masond4dbff92007-04-04 14:08:15 -04001869 *root, struct btrfs_key *ins_key,
Chris Masoncc0c5532007-10-25 15:42:57 -04001870 struct btrfs_path *path, int data_size, int extend)
Chris Masonbe0e5c02007-01-26 15:51:26 -05001871{
Chris Mason7bb86312007-12-11 09:25:06 -05001872 u64 root_gen;
Chris Mason5f39d392007-10-15 16:14:19 -04001873 struct extent_buffer *l;
Chris Mason7518a232007-03-12 12:01:18 -04001874 u32 nritems;
Chris Masoneb60cea2007-02-02 09:18:22 -05001875 int mid;
1876 int slot;
Chris Mason5f39d392007-10-15 16:14:19 -04001877 struct extent_buffer *right;
Chris Mason0783fcf2007-03-12 20:12:07 -04001878 int space_needed = data_size + sizeof(struct btrfs_item);
Chris Masonbe0e5c02007-01-26 15:51:26 -05001879 int data_copy_size;
1880 int rt_data_off;
1881 int i;
Chris Masond4dbff92007-04-04 14:08:15 -04001882 int ret = 0;
Chris Masonaa5d6be2007-02-28 16:35:06 -05001883 int wret;
Chris Masoncc0c5532007-10-25 15:42:57 -04001884 int double_split;
1885 int num_doubles = 0;
Chris Masond4dbff92007-04-04 14:08:15 -04001886 struct btrfs_disk_key disk_key;
Chris Masonbe0e5c02007-01-26 15:51:26 -05001887
Chris Masoncc0c5532007-10-25 15:42:57 -04001888 if (extend)
1889 space_needed = data_size;
1890
Chris Mason7bb86312007-12-11 09:25:06 -05001891 if (root->ref_cows)
1892 root_gen = trans->transid;
1893 else
1894 root_gen = 0;
1895
Chris Mason40689472007-03-17 14:29:23 -04001896 /* first try to make some room by pushing left and right */
Chris Mason3685f792007-10-19 09:23:27 -04001897 if (ins_key->type != BTRFS_DIR_ITEM_KEY) {
Chris Mason34a38212007-11-07 13:31:03 -05001898 wret = push_leaf_right(trans, root, path, data_size, 0);
Chris Mason3685f792007-10-19 09:23:27 -04001899 if (wret < 0) {
Chris Masoneaee50e2007-03-13 11:17:52 -04001900 return wret;
Chris Mason3685f792007-10-19 09:23:27 -04001901 }
1902 if (wret) {
Chris Mason34a38212007-11-07 13:31:03 -05001903 wret = push_leaf_left(trans, root, path, data_size, 0);
Chris Mason3685f792007-10-19 09:23:27 -04001904 if (wret < 0)
1905 return wret;
1906 }
1907 l = path->nodes[0];
Chris Masonaa5d6be2007-02-28 16:35:06 -05001908
Chris Mason3685f792007-10-19 09:23:27 -04001909 /* did the pushes work? */
Chris Masoncc0c5532007-10-25 15:42:57 -04001910 if (btrfs_leaf_free_space(root, l) >= space_needed)
Chris Mason3685f792007-10-19 09:23:27 -04001911 return 0;
Chris Mason3326d1b2007-10-15 16:18:25 -04001912 }
Chris Masonaa5d6be2007-02-28 16:35:06 -05001913
Chris Mason5c680ed2007-02-22 11:39:13 -05001914 if (!path->nodes[1]) {
Chris Masone089f052007-03-16 16:20:31 -04001915 ret = insert_new_root(trans, root, path, 1);
Chris Mason5c680ed2007-02-22 11:39:13 -05001916 if (ret)
1917 return ret;
1918 }
Chris Masoncc0c5532007-10-25 15:42:57 -04001919again:
1920 double_split = 0;
1921 l = path->nodes[0];
Chris Masoneb60cea2007-02-02 09:18:22 -05001922 slot = path->slots[0];
Chris Mason5f39d392007-10-15 16:14:19 -04001923 nritems = btrfs_header_nritems(l);
Chris Masoneb60cea2007-02-02 09:18:22 -05001924 mid = (nritems + 1)/ 2;
Chris Mason54aa1f42007-06-22 14:16:25 -04001925
Chris Mason7bb86312007-12-11 09:25:06 -05001926 btrfs_item_key(l, &disk_key, 0);
1927
1928 right = __btrfs_alloc_free_block(trans, root, root->leafsize,
1929 root->root_key.objectid,
1930 root_gen, disk_key.objectid, 0,
1931 l->start, 0);
Chris Mason5f39d392007-10-15 16:14:19 -04001932 if (IS_ERR(right))
1933 return PTR_ERR(right);
Chris Mason54aa1f42007-06-22 14:16:25 -04001934
Chris Mason5f39d392007-10-15 16:14:19 -04001935 memset_extent_buffer(right, 0, 0, sizeof(struct btrfs_header));
Chris Masondb945352007-10-15 16:15:53 -04001936 btrfs_set_header_bytenr(right, right->start);
Chris Mason5f39d392007-10-15 16:14:19 -04001937 btrfs_set_header_generation(right, trans->transid);
1938 btrfs_set_header_owner(right, root->root_key.objectid);
1939 btrfs_set_header_level(right, 0);
1940 write_extent_buffer(right, root->fs_info->fsid,
1941 (unsigned long)btrfs_header_fsid(right),
1942 BTRFS_FSID_SIZE);
Chris Masond4dbff92007-04-04 14:08:15 -04001943 if (mid <= slot) {
1944 if (nritems == 1 ||
1945 leaf_space_used(l, mid, nritems - mid) + space_needed >
1946 BTRFS_LEAF_DATA_SIZE(root)) {
1947 if (slot >= nritems) {
1948 btrfs_cpu_key_to_disk(&disk_key, ins_key);
Chris Mason5f39d392007-10-15 16:14:19 -04001949 btrfs_set_header_nritems(right, 0);
Chris Masond4dbff92007-04-04 14:08:15 -04001950 wret = insert_ptr(trans, root, path,
Chris Masondb945352007-10-15 16:15:53 -04001951 &disk_key, right->start,
Chris Masond4dbff92007-04-04 14:08:15 -04001952 path->slots[1] + 1, 1);
1953 if (wret)
1954 ret = wret;
Chris Mason5f39d392007-10-15 16:14:19 -04001955 free_extent_buffer(path->nodes[0]);
1956 path->nodes[0] = right;
Chris Masond4dbff92007-04-04 14:08:15 -04001957 path->slots[0] = 0;
1958 path->slots[1] += 1;
1959 return ret;
1960 }
1961 mid = slot;
Chris Mason3326d1b2007-10-15 16:18:25 -04001962 if (mid != nritems &&
1963 leaf_space_used(l, mid, nritems - mid) +
1964 space_needed > BTRFS_LEAF_DATA_SIZE(root)) {
1965 double_split = 1;
1966 }
Chris Masond4dbff92007-04-04 14:08:15 -04001967 }
1968 } else {
1969 if (leaf_space_used(l, 0, mid + 1) + space_needed >
1970 BTRFS_LEAF_DATA_SIZE(root)) {
Chris Masoncc0c5532007-10-25 15:42:57 -04001971 if (!extend && slot == 0) {
Chris Masond4dbff92007-04-04 14:08:15 -04001972 btrfs_cpu_key_to_disk(&disk_key, ins_key);
Chris Mason5f39d392007-10-15 16:14:19 -04001973 btrfs_set_header_nritems(right, 0);
Chris Masond4dbff92007-04-04 14:08:15 -04001974 wret = insert_ptr(trans, root, path,
1975 &disk_key,
Chris Masondb945352007-10-15 16:15:53 -04001976 right->start,
Chris Mason098f59c2007-05-11 11:33:21 -04001977 path->slots[1], 1);
Chris Masond4dbff92007-04-04 14:08:15 -04001978 if (wret)
1979 ret = wret;
Chris Mason5f39d392007-10-15 16:14:19 -04001980 free_extent_buffer(path->nodes[0]);
1981 path->nodes[0] = right;
Chris Masond4dbff92007-04-04 14:08:15 -04001982 path->slots[0] = 0;
Chris Masona429e512007-04-18 16:15:28 -04001983 if (path->slots[1] == 0) {
1984 wret = fixup_low_keys(trans, root,
1985 path, &disk_key, 1);
1986 if (wret)
1987 ret = wret;
1988 }
Chris Masond4dbff92007-04-04 14:08:15 -04001989 return ret;
Chris Masoncc0c5532007-10-25 15:42:57 -04001990 } else if (extend && slot == 0) {
1991 mid = 1;
1992 } else {
1993 mid = slot;
1994 if (mid != nritems &&
1995 leaf_space_used(l, mid, nritems - mid) +
1996 space_needed > BTRFS_LEAF_DATA_SIZE(root)) {
1997 double_split = 1;
1998 }
Chris Mason5ee78ac2007-10-19 14:01:21 -04001999 }
Chris Masond4dbff92007-04-04 14:08:15 -04002000 }
2001 }
Chris Mason5f39d392007-10-15 16:14:19 -04002002 nritems = nritems - mid;
2003 btrfs_set_header_nritems(right, nritems);
2004 data_copy_size = btrfs_item_end_nr(l, mid) - leaf_data_end(root, l);
2005
2006 copy_extent_buffer(right, l, btrfs_item_nr_offset(0),
2007 btrfs_item_nr_offset(mid),
2008 nritems * sizeof(struct btrfs_item));
2009
2010 copy_extent_buffer(right, l,
Chris Masond6025572007-03-30 14:27:56 -04002011 btrfs_leaf_data(right) + BTRFS_LEAF_DATA_SIZE(root) -
2012 data_copy_size, btrfs_leaf_data(l) +
2013 leaf_data_end(root, l), data_copy_size);
Chris Mason74123bd2007-02-02 11:05:29 -05002014
Chris Mason5f39d392007-10-15 16:14:19 -04002015 rt_data_off = BTRFS_LEAF_DATA_SIZE(root) -
2016 btrfs_item_end_nr(l, mid);
2017
2018 for (i = 0; i < nritems; i++) {
2019 struct btrfs_item *item = btrfs_item_nr(right, i);
Chris Masondb945352007-10-15 16:15:53 -04002020 u32 ioff;
2021
2022 if (!right->map_token) {
2023 map_extent_buffer(right, (unsigned long)item,
2024 sizeof(struct btrfs_item),
2025 &right->map_token, &right->kaddr,
2026 &right->map_start, &right->map_len,
2027 KM_USER1);
2028 }
2029
2030 ioff = btrfs_item_offset(right, item);
Chris Mason5f39d392007-10-15 16:14:19 -04002031 btrfs_set_item_offset(right, item, ioff + rt_data_off);
Chris Mason0783fcf2007-03-12 20:12:07 -04002032 }
Chris Mason74123bd2007-02-02 11:05:29 -05002033
Chris Masondb945352007-10-15 16:15:53 -04002034 if (right->map_token) {
2035 unmap_extent_buffer(right, right->map_token, KM_USER1);
2036 right->map_token = NULL;
2037 }
2038
Chris Mason5f39d392007-10-15 16:14:19 -04002039 btrfs_set_header_nritems(l, mid);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002040 ret = 0;
Chris Mason5f39d392007-10-15 16:14:19 -04002041 btrfs_item_key(right, &disk_key, 0);
Chris Masondb945352007-10-15 16:15:53 -04002042 wret = insert_ptr(trans, root, path, &disk_key, right->start,
2043 path->slots[1] + 1, 1);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002044 if (wret)
2045 ret = wret;
Chris Mason5f39d392007-10-15 16:14:19 -04002046
2047 btrfs_mark_buffer_dirty(right);
2048 btrfs_mark_buffer_dirty(l);
Chris Masoneb60cea2007-02-02 09:18:22 -05002049 BUG_ON(path->slots[0] != slot);
Chris Mason5f39d392007-10-15 16:14:19 -04002050
Chris Masonbe0e5c02007-01-26 15:51:26 -05002051 if (mid <= slot) {
Chris Mason5f39d392007-10-15 16:14:19 -04002052 free_extent_buffer(path->nodes[0]);
2053 path->nodes[0] = right;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002054 path->slots[0] -= mid;
2055 path->slots[1] += 1;
Chris Masoneb60cea2007-02-02 09:18:22 -05002056 } else
Chris Mason5f39d392007-10-15 16:14:19 -04002057 free_extent_buffer(right);
2058
Chris Masoneb60cea2007-02-02 09:18:22 -05002059 BUG_ON(path->slots[0] < 0);
Chris Masond4dbff92007-04-04 14:08:15 -04002060
Chris Masoncc0c5532007-10-25 15:42:57 -04002061 if (double_split) {
2062 BUG_ON(num_doubles != 0);
2063 num_doubles++;
2064 goto again;
Chris Mason3326d1b2007-10-15 16:18:25 -04002065 }
Chris Masonbe0e5c02007-01-26 15:51:26 -05002066 return ret;
2067}
2068
Chris Masonb18c6682007-04-17 13:26:50 -04002069int btrfs_truncate_item(struct btrfs_trans_handle *trans,
2070 struct btrfs_root *root,
2071 struct btrfs_path *path,
Chris Mason179e29e2007-11-01 11:28:41 -04002072 u32 new_size, int from_end)
Chris Masonb18c6682007-04-17 13:26:50 -04002073{
2074 int ret = 0;
2075 int slot;
2076 int slot_orig;
Chris Mason5f39d392007-10-15 16:14:19 -04002077 struct extent_buffer *leaf;
2078 struct btrfs_item *item;
Chris Masonb18c6682007-04-17 13:26:50 -04002079 u32 nritems;
2080 unsigned int data_end;
2081 unsigned int old_data_start;
2082 unsigned int old_size;
2083 unsigned int size_diff;
2084 int i;
2085
2086 slot_orig = path->slots[0];
Chris Mason5f39d392007-10-15 16:14:19 -04002087 leaf = path->nodes[0];
Chris Mason179e29e2007-11-01 11:28:41 -04002088 slot = path->slots[0];
2089
2090 old_size = btrfs_item_size_nr(leaf, slot);
2091 if (old_size == new_size)
2092 return 0;
Chris Masonb18c6682007-04-17 13:26:50 -04002093
Chris Mason5f39d392007-10-15 16:14:19 -04002094 nritems = btrfs_header_nritems(leaf);
Chris Masonb18c6682007-04-17 13:26:50 -04002095 data_end = leaf_data_end(root, leaf);
2096
Chris Mason5f39d392007-10-15 16:14:19 -04002097 old_data_start = btrfs_item_offset_nr(leaf, slot);
Chris Mason179e29e2007-11-01 11:28:41 -04002098
Chris Masonb18c6682007-04-17 13:26:50 -04002099 size_diff = old_size - new_size;
2100
2101 BUG_ON(slot < 0);
2102 BUG_ON(slot >= nritems);
2103
2104 /*
2105 * item0..itemN ... dataN.offset..dataN.size .. data0.size
2106 */
2107 /* first correct the data pointers */
2108 for (i = slot; i < nritems; i++) {
Chris Mason5f39d392007-10-15 16:14:19 -04002109 u32 ioff;
2110 item = btrfs_item_nr(leaf, i);
Chris Masondb945352007-10-15 16:15:53 -04002111
2112 if (!leaf->map_token) {
2113 map_extent_buffer(leaf, (unsigned long)item,
2114 sizeof(struct btrfs_item),
2115 &leaf->map_token, &leaf->kaddr,
2116 &leaf->map_start, &leaf->map_len,
2117 KM_USER1);
2118 }
2119
Chris Mason5f39d392007-10-15 16:14:19 -04002120 ioff = btrfs_item_offset(leaf, item);
2121 btrfs_set_item_offset(leaf, item, ioff + size_diff);
Chris Masonb18c6682007-04-17 13:26:50 -04002122 }
Chris Masondb945352007-10-15 16:15:53 -04002123
2124 if (leaf->map_token) {
2125 unmap_extent_buffer(leaf, leaf->map_token, KM_USER1);
2126 leaf->map_token = NULL;
2127 }
2128
Chris Masonb18c6682007-04-17 13:26:50 -04002129 /* shift the data */
Chris Mason179e29e2007-11-01 11:28:41 -04002130 if (from_end) {
2131 memmove_extent_buffer(leaf, btrfs_leaf_data(leaf) +
2132 data_end + size_diff, btrfs_leaf_data(leaf) +
2133 data_end, old_data_start + new_size - data_end);
2134 } else {
2135 struct btrfs_disk_key disk_key;
2136 u64 offset;
2137
2138 btrfs_item_key(leaf, &disk_key, slot);
2139
2140 if (btrfs_disk_key_type(&disk_key) == BTRFS_EXTENT_DATA_KEY) {
2141 unsigned long ptr;
2142 struct btrfs_file_extent_item *fi;
2143
2144 fi = btrfs_item_ptr(leaf, slot,
2145 struct btrfs_file_extent_item);
2146 fi = (struct btrfs_file_extent_item *)(
2147 (unsigned long)fi - size_diff);
2148
2149 if (btrfs_file_extent_type(leaf, fi) ==
2150 BTRFS_FILE_EXTENT_INLINE) {
2151 ptr = btrfs_item_ptr_offset(leaf, slot);
2152 memmove_extent_buffer(leaf, ptr,
2153 (unsigned long)fi,
2154 offsetof(struct btrfs_file_extent_item,
2155 disk_bytenr));
2156 }
2157 }
2158
2159 memmove_extent_buffer(leaf, btrfs_leaf_data(leaf) +
2160 data_end + size_diff, btrfs_leaf_data(leaf) +
2161 data_end, old_data_start - data_end);
2162
2163 offset = btrfs_disk_key_offset(&disk_key);
2164 btrfs_set_disk_key_offset(&disk_key, offset + size_diff);
2165 btrfs_set_item_key(leaf, &disk_key, slot);
2166 if (slot == 0)
2167 fixup_low_keys(trans, root, path, &disk_key, 1);
2168 }
Chris Mason5f39d392007-10-15 16:14:19 -04002169
2170 item = btrfs_item_nr(leaf, slot);
2171 btrfs_set_item_size(leaf, item, new_size);
2172 btrfs_mark_buffer_dirty(leaf);
Chris Masonb18c6682007-04-17 13:26:50 -04002173
2174 ret = 0;
Chris Mason5f39d392007-10-15 16:14:19 -04002175 if (btrfs_leaf_free_space(root, leaf) < 0) {
2176 btrfs_print_leaf(root, leaf);
Chris Masonb18c6682007-04-17 13:26:50 -04002177 BUG();
Chris Mason5f39d392007-10-15 16:14:19 -04002178 }
Chris Masonb18c6682007-04-17 13:26:50 -04002179 return ret;
2180}
2181
Chris Mason5f39d392007-10-15 16:14:19 -04002182int btrfs_extend_item(struct btrfs_trans_handle *trans,
2183 struct btrfs_root *root, struct btrfs_path *path,
2184 u32 data_size)
Chris Mason6567e832007-04-16 09:22:45 -04002185{
2186 int ret = 0;
2187 int slot;
2188 int slot_orig;
Chris Mason5f39d392007-10-15 16:14:19 -04002189 struct extent_buffer *leaf;
2190 struct btrfs_item *item;
Chris Mason6567e832007-04-16 09:22:45 -04002191 u32 nritems;
2192 unsigned int data_end;
2193 unsigned int old_data;
2194 unsigned int old_size;
2195 int i;
2196
2197 slot_orig = path->slots[0];
Chris Mason5f39d392007-10-15 16:14:19 -04002198 leaf = path->nodes[0];
Chris Mason6567e832007-04-16 09:22:45 -04002199
Chris Mason5f39d392007-10-15 16:14:19 -04002200 nritems = btrfs_header_nritems(leaf);
Chris Mason6567e832007-04-16 09:22:45 -04002201 data_end = leaf_data_end(root, leaf);
2202
Chris Mason5f39d392007-10-15 16:14:19 -04002203 if (btrfs_leaf_free_space(root, leaf) < data_size) {
2204 btrfs_print_leaf(root, leaf);
Chris Mason6567e832007-04-16 09:22:45 -04002205 BUG();
Chris Mason5f39d392007-10-15 16:14:19 -04002206 }
Chris Mason6567e832007-04-16 09:22:45 -04002207 slot = path->slots[0];
Chris Mason5f39d392007-10-15 16:14:19 -04002208 old_data = btrfs_item_end_nr(leaf, slot);
Chris Mason6567e832007-04-16 09:22:45 -04002209
2210 BUG_ON(slot < 0);
Chris Mason3326d1b2007-10-15 16:18:25 -04002211 if (slot >= nritems) {
2212 btrfs_print_leaf(root, leaf);
2213 printk("slot %d too large, nritems %d\n", slot, nritems);
2214 BUG_ON(1);
2215 }
Chris Mason6567e832007-04-16 09:22:45 -04002216
2217 /*
2218 * item0..itemN ... dataN.offset..dataN.size .. data0.size
2219 */
2220 /* first correct the data pointers */
2221 for (i = slot; i < nritems; i++) {
Chris Mason5f39d392007-10-15 16:14:19 -04002222 u32 ioff;
2223 item = btrfs_item_nr(leaf, i);
Chris Masondb945352007-10-15 16:15:53 -04002224
2225 if (!leaf->map_token) {
2226 map_extent_buffer(leaf, (unsigned long)item,
2227 sizeof(struct btrfs_item),
2228 &leaf->map_token, &leaf->kaddr,
2229 &leaf->map_start, &leaf->map_len,
2230 KM_USER1);
2231 }
Chris Mason5f39d392007-10-15 16:14:19 -04002232 ioff = btrfs_item_offset(leaf, item);
2233 btrfs_set_item_offset(leaf, item, ioff - data_size);
Chris Mason6567e832007-04-16 09:22:45 -04002234 }
Chris Mason5f39d392007-10-15 16:14:19 -04002235
Chris Masondb945352007-10-15 16:15:53 -04002236 if (leaf->map_token) {
2237 unmap_extent_buffer(leaf, leaf->map_token, KM_USER1);
2238 leaf->map_token = NULL;
2239 }
2240
Chris Mason6567e832007-04-16 09:22:45 -04002241 /* shift the data */
Chris Mason5f39d392007-10-15 16:14:19 -04002242 memmove_extent_buffer(leaf, btrfs_leaf_data(leaf) +
Chris Mason6567e832007-04-16 09:22:45 -04002243 data_end - data_size, btrfs_leaf_data(leaf) +
2244 data_end, old_data - data_end);
Chris Mason5f39d392007-10-15 16:14:19 -04002245
Chris Mason6567e832007-04-16 09:22:45 -04002246 data_end = old_data;
Chris Mason5f39d392007-10-15 16:14:19 -04002247 old_size = btrfs_item_size_nr(leaf, slot);
2248 item = btrfs_item_nr(leaf, slot);
2249 btrfs_set_item_size(leaf, item, old_size + data_size);
2250 btrfs_mark_buffer_dirty(leaf);
Chris Mason6567e832007-04-16 09:22:45 -04002251
2252 ret = 0;
Chris Mason5f39d392007-10-15 16:14:19 -04002253 if (btrfs_leaf_free_space(root, leaf) < 0) {
2254 btrfs_print_leaf(root, leaf);
Chris Mason6567e832007-04-16 09:22:45 -04002255 BUG();
Chris Mason5f39d392007-10-15 16:14:19 -04002256 }
Chris Mason6567e832007-04-16 09:22:45 -04002257 return ret;
2258}
2259
Chris Mason74123bd2007-02-02 11:05:29 -05002260/*
2261 * Given a key and some data, insert an item into the tree.
2262 * This does all the path init required, making room in the tree if needed.
2263 */
Chris Mason5f39d392007-10-15 16:14:19 -04002264int btrfs_insert_empty_item(struct btrfs_trans_handle *trans,
2265 struct btrfs_root *root,
2266 struct btrfs_path *path,
2267 struct btrfs_key *cpu_key, u32 data_size)
Chris Masonbe0e5c02007-01-26 15:51:26 -05002268{
Chris Mason5f39d392007-10-15 16:14:19 -04002269 struct extent_buffer *leaf;
2270 struct btrfs_item *item;
Chris Masonaa5d6be2007-02-28 16:35:06 -05002271 int ret = 0;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002272 int slot;
Chris Masoneb60cea2007-02-02 09:18:22 -05002273 int slot_orig;
Chris Mason7518a232007-03-12 12:01:18 -04002274 u32 nritems;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002275 unsigned int data_end;
Chris Masone2fa7222007-03-12 16:22:34 -04002276 struct btrfs_disk_key disk_key;
2277
2278 btrfs_cpu_key_to_disk(&disk_key, cpu_key);
Chris Masonbe0e5c02007-01-26 15:51:26 -05002279
Chris Mason74123bd2007-02-02 11:05:29 -05002280 /* create a root if there isn't one */
Chris Mason5c680ed2007-02-22 11:39:13 -05002281 if (!root->node)
Chris Masoncfaa7292007-02-21 17:04:57 -05002282 BUG();
Chris Mason5f39d392007-10-15 16:14:19 -04002283
Chris Masone089f052007-03-16 16:20:31 -04002284 ret = btrfs_search_slot(trans, root, cpu_key, path, data_size, 1);
Chris Masoneb60cea2007-02-02 09:18:22 -05002285 if (ret == 0) {
Chris Masonf0930a32007-03-02 09:47:58 -05002286 return -EEXIST;
Chris Masonaa5d6be2007-02-28 16:35:06 -05002287 }
Chris Masoned2ff2c2007-03-01 18:59:40 -05002288 if (ret < 0)
2289 goto out;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002290
Chris Mason62e27492007-03-15 12:56:47 -04002291 slot_orig = path->slots[0];
Chris Mason5f39d392007-10-15 16:14:19 -04002292 leaf = path->nodes[0];
Chris Mason74123bd2007-02-02 11:05:29 -05002293
Chris Mason5f39d392007-10-15 16:14:19 -04002294 nritems = btrfs_header_nritems(leaf);
Chris Mason123abc82007-03-14 14:14:43 -04002295 data_end = leaf_data_end(root, leaf);
Chris Masoneb60cea2007-02-02 09:18:22 -05002296
Chris Mason123abc82007-03-14 14:14:43 -04002297 if (btrfs_leaf_free_space(root, leaf) <
Chris Masond4dbff92007-04-04 14:08:15 -04002298 sizeof(struct btrfs_item) + data_size) {
Chris Mason3326d1b2007-10-15 16:18:25 -04002299 btrfs_print_leaf(root, leaf);
2300 printk("not enough freespace need %u have %d\n",
2301 data_size, btrfs_leaf_free_space(root, leaf));
Chris Masonbe0e5c02007-01-26 15:51:26 -05002302 BUG();
Chris Masond4dbff92007-04-04 14:08:15 -04002303 }
Chris Mason5f39d392007-10-15 16:14:19 -04002304
Chris Mason62e27492007-03-15 12:56:47 -04002305 slot = path->slots[0];
Chris Masoneb60cea2007-02-02 09:18:22 -05002306 BUG_ON(slot < 0);
Chris Mason5f39d392007-10-15 16:14:19 -04002307
Chris Masonbe0e5c02007-01-26 15:51:26 -05002308 if (slot != nritems) {
2309 int i;
Chris Mason5f39d392007-10-15 16:14:19 -04002310 unsigned int old_data = btrfs_item_end_nr(leaf, slot);
Chris Masonbe0e5c02007-01-26 15:51:26 -05002311
Chris Mason5f39d392007-10-15 16:14:19 -04002312 if (old_data < data_end) {
2313 btrfs_print_leaf(root, leaf);
2314 printk("slot %d old_data %d data_end %d\n",
2315 slot, old_data, data_end);
2316 BUG_ON(1);
2317 }
Chris Masonbe0e5c02007-01-26 15:51:26 -05002318 /*
2319 * item0..itemN ... dataN.offset..dataN.size .. data0.size
2320 */
2321 /* first correct the data pointers */
Chris Masondb945352007-10-15 16:15:53 -04002322 WARN_ON(leaf->map_token);
Chris Mason0783fcf2007-03-12 20:12:07 -04002323 for (i = slot; i < nritems; i++) {
Chris Mason5f39d392007-10-15 16:14:19 -04002324 u32 ioff;
Chris Masondb945352007-10-15 16:15:53 -04002325
Chris Mason5f39d392007-10-15 16:14:19 -04002326 item = btrfs_item_nr(leaf, i);
Chris Masondb945352007-10-15 16:15:53 -04002327 if (!leaf->map_token) {
2328 map_extent_buffer(leaf, (unsigned long)item,
2329 sizeof(struct btrfs_item),
2330 &leaf->map_token, &leaf->kaddr,
2331 &leaf->map_start, &leaf->map_len,
2332 KM_USER1);
2333 }
2334
Chris Mason5f39d392007-10-15 16:14:19 -04002335 ioff = btrfs_item_offset(leaf, item);
2336 btrfs_set_item_offset(leaf, item, ioff - data_size);
Chris Mason0783fcf2007-03-12 20:12:07 -04002337 }
Chris Masondb945352007-10-15 16:15:53 -04002338 if (leaf->map_token) {
2339 unmap_extent_buffer(leaf, leaf->map_token, KM_USER1);
2340 leaf->map_token = NULL;
2341 }
Chris Masonbe0e5c02007-01-26 15:51:26 -05002342
2343 /* shift the items */
Chris Mason5f39d392007-10-15 16:14:19 -04002344 memmove_extent_buffer(leaf, btrfs_item_nr_offset(slot + 1),
2345 btrfs_item_nr_offset(slot),
Chris Masond6025572007-03-30 14:27:56 -04002346 (nritems - slot) * sizeof(struct btrfs_item));
Chris Masonbe0e5c02007-01-26 15:51:26 -05002347
2348 /* shift the data */
Chris Mason5f39d392007-10-15 16:14:19 -04002349 memmove_extent_buffer(leaf, btrfs_leaf_data(leaf) +
Chris Masond6025572007-03-30 14:27:56 -04002350 data_end - data_size, btrfs_leaf_data(leaf) +
2351 data_end, old_data - data_end);
Chris Masonbe0e5c02007-01-26 15:51:26 -05002352 data_end = old_data;
2353 }
Chris Mason5f39d392007-10-15 16:14:19 -04002354
Chris Mason62e27492007-03-15 12:56:47 -04002355 /* setup the item for the new data */
Chris Mason5f39d392007-10-15 16:14:19 -04002356 btrfs_set_item_key(leaf, &disk_key, slot);
2357 item = btrfs_item_nr(leaf, slot);
2358 btrfs_set_item_offset(leaf, item, data_end - data_size);
2359 btrfs_set_item_size(leaf, item, data_size);
2360 btrfs_set_header_nritems(leaf, nritems + 1);
2361 btrfs_mark_buffer_dirty(leaf);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002362
2363 ret = 0;
Chris Mason8e19f2c2007-02-28 09:27:02 -05002364 if (slot == 0)
Chris Masone089f052007-03-16 16:20:31 -04002365 ret = fixup_low_keys(trans, root, path, &disk_key, 1);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002366
Chris Mason5f39d392007-10-15 16:14:19 -04002367 if (btrfs_leaf_free_space(root, leaf) < 0) {
2368 btrfs_print_leaf(root, leaf);
Chris Masonbe0e5c02007-01-26 15:51:26 -05002369 BUG();
Chris Mason5f39d392007-10-15 16:14:19 -04002370 }
Chris Masoned2ff2c2007-03-01 18:59:40 -05002371out:
Chris Mason62e27492007-03-15 12:56:47 -04002372 return ret;
2373}
2374
2375/*
2376 * Given a key and some data, insert an item into the tree.
2377 * This does all the path init required, making room in the tree if needed.
2378 */
Chris Masone089f052007-03-16 16:20:31 -04002379int btrfs_insert_item(struct btrfs_trans_handle *trans, struct btrfs_root
2380 *root, struct btrfs_key *cpu_key, void *data, u32
2381 data_size)
Chris Mason62e27492007-03-15 12:56:47 -04002382{
2383 int ret = 0;
Chris Mason2c90e5d2007-04-02 10:50:19 -04002384 struct btrfs_path *path;
Chris Mason5f39d392007-10-15 16:14:19 -04002385 struct extent_buffer *leaf;
2386 unsigned long ptr;
Chris Mason62e27492007-03-15 12:56:47 -04002387
Chris Mason2c90e5d2007-04-02 10:50:19 -04002388 path = btrfs_alloc_path();
2389 BUG_ON(!path);
Chris Mason2c90e5d2007-04-02 10:50:19 -04002390 ret = btrfs_insert_empty_item(trans, root, path, cpu_key, data_size);
Chris Mason62e27492007-03-15 12:56:47 -04002391 if (!ret) {
Chris Mason5f39d392007-10-15 16:14:19 -04002392 leaf = path->nodes[0];
2393 ptr = btrfs_item_ptr_offset(leaf, path->slots[0]);
2394 write_extent_buffer(leaf, data, ptr, data_size);
2395 btrfs_mark_buffer_dirty(leaf);
Chris Mason62e27492007-03-15 12:56:47 -04002396 }
Chris Mason2c90e5d2007-04-02 10:50:19 -04002397 btrfs_free_path(path);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002398 return ret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002399}
2400
Chris Mason74123bd2007-02-02 11:05:29 -05002401/*
Chris Mason5de08d72007-02-24 06:24:44 -05002402 * delete the pointer from a given node.
Chris Mason74123bd2007-02-02 11:05:29 -05002403 *
2404 * If the delete empties a node, the node is removed from the tree,
2405 * continuing all the way the root if required. The root is converted into
2406 * a leaf if all the nodes are emptied.
2407 */
Chris Masone089f052007-03-16 16:20:31 -04002408static int del_ptr(struct btrfs_trans_handle *trans, struct btrfs_root *root,
2409 struct btrfs_path *path, int level, int slot)
Chris Masonbe0e5c02007-01-26 15:51:26 -05002410{
Chris Mason5f39d392007-10-15 16:14:19 -04002411 struct extent_buffer *parent = path->nodes[level];
Chris Mason7518a232007-03-12 12:01:18 -04002412 u32 nritems;
Chris Masonaa5d6be2007-02-28 16:35:06 -05002413 int ret = 0;
Chris Masonbb803952007-03-01 12:04:21 -05002414 int wret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002415
Chris Mason5f39d392007-10-15 16:14:19 -04002416 nritems = btrfs_header_nritems(parent);
Chris Masonbb803952007-03-01 12:04:21 -05002417 if (slot != nritems -1) {
Chris Mason5f39d392007-10-15 16:14:19 -04002418 memmove_extent_buffer(parent,
2419 btrfs_node_key_ptr_offset(slot),
2420 btrfs_node_key_ptr_offset(slot + 1),
Chris Masond6025572007-03-30 14:27:56 -04002421 sizeof(struct btrfs_key_ptr) *
2422 (nritems - slot - 1));
Chris Masonbb803952007-03-01 12:04:21 -05002423 }
Chris Mason7518a232007-03-12 12:01:18 -04002424 nritems--;
Chris Mason5f39d392007-10-15 16:14:19 -04002425 btrfs_set_header_nritems(parent, nritems);
Chris Mason7518a232007-03-12 12:01:18 -04002426 if (nritems == 0 && parent == root->node) {
Chris Mason5f39d392007-10-15 16:14:19 -04002427 BUG_ON(btrfs_header_level(root->node) != 1);
Chris Masonbb803952007-03-01 12:04:21 -05002428 /* just turn the root into a leaf and break */
Chris Mason5f39d392007-10-15 16:14:19 -04002429 btrfs_set_header_level(root->node, 0);
Chris Masonbb803952007-03-01 12:04:21 -05002430 } else if (slot == 0) {
Chris Mason5f39d392007-10-15 16:14:19 -04002431 struct btrfs_disk_key disk_key;
2432
2433 btrfs_node_key(parent, &disk_key, 0);
2434 wret = fixup_low_keys(trans, root, path, &disk_key, level + 1);
Chris Mason0f70abe2007-02-28 16:46:22 -05002435 if (wret)
2436 ret = wret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002437 }
Chris Masond6025572007-03-30 14:27:56 -04002438 btrfs_mark_buffer_dirty(parent);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002439 return ret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002440}
2441
Chris Mason74123bd2007-02-02 11:05:29 -05002442/*
2443 * delete the item at the leaf level in path. If that empties
2444 * the leaf, remove it from the tree
2445 */
Chris Masone089f052007-03-16 16:20:31 -04002446int btrfs_del_item(struct btrfs_trans_handle *trans, struct btrfs_root *root,
2447 struct btrfs_path *path)
Chris Masonbe0e5c02007-01-26 15:51:26 -05002448{
Chris Masonbe0e5c02007-01-26 15:51:26 -05002449 int slot;
Chris Mason5f39d392007-10-15 16:14:19 -04002450 struct extent_buffer *leaf;
2451 struct btrfs_item *item;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002452 int doff;
2453 int dsize;
Chris Masonaa5d6be2007-02-28 16:35:06 -05002454 int ret = 0;
2455 int wret;
Chris Mason7518a232007-03-12 12:01:18 -04002456 u32 nritems;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002457
Chris Mason5f39d392007-10-15 16:14:19 -04002458 leaf = path->nodes[0];
Chris Mason4920c9a2007-01-26 16:38:42 -05002459 slot = path->slots[0];
Chris Mason5f39d392007-10-15 16:14:19 -04002460 doff = btrfs_item_offset_nr(leaf, slot);
2461 dsize = btrfs_item_size_nr(leaf, slot);
2462 nritems = btrfs_header_nritems(leaf);
Chris Masonbe0e5c02007-01-26 15:51:26 -05002463
Chris Mason7518a232007-03-12 12:01:18 -04002464 if (slot != nritems - 1) {
Chris Masonbe0e5c02007-01-26 15:51:26 -05002465 int i;
Chris Mason123abc82007-03-14 14:14:43 -04002466 int data_end = leaf_data_end(root, leaf);
Chris Mason5f39d392007-10-15 16:14:19 -04002467
2468 memmove_extent_buffer(leaf, btrfs_leaf_data(leaf) +
Chris Masond6025572007-03-30 14:27:56 -04002469 data_end + dsize,
2470 btrfs_leaf_data(leaf) + data_end,
2471 doff - data_end);
Chris Mason5f39d392007-10-15 16:14:19 -04002472
Chris Mason0783fcf2007-03-12 20:12:07 -04002473 for (i = slot + 1; i < nritems; i++) {
Chris Mason5f39d392007-10-15 16:14:19 -04002474 u32 ioff;
Chris Masondb945352007-10-15 16:15:53 -04002475
Chris Mason5f39d392007-10-15 16:14:19 -04002476 item = btrfs_item_nr(leaf, i);
Chris Masondb945352007-10-15 16:15:53 -04002477 if (!leaf->map_token) {
2478 map_extent_buffer(leaf, (unsigned long)item,
2479 sizeof(struct btrfs_item),
2480 &leaf->map_token, &leaf->kaddr,
2481 &leaf->map_start, &leaf->map_len,
2482 KM_USER1);
2483 }
Chris Mason5f39d392007-10-15 16:14:19 -04002484 ioff = btrfs_item_offset(leaf, item);
2485 btrfs_set_item_offset(leaf, item, ioff + dsize);
Chris Mason0783fcf2007-03-12 20:12:07 -04002486 }
Chris Masondb945352007-10-15 16:15:53 -04002487
2488 if (leaf->map_token) {
2489 unmap_extent_buffer(leaf, leaf->map_token, KM_USER1);
2490 leaf->map_token = NULL;
2491 }
2492
Chris Mason5f39d392007-10-15 16:14:19 -04002493 memmove_extent_buffer(leaf, btrfs_item_nr_offset(slot),
2494 btrfs_item_nr_offset(slot + 1),
Chris Masond6025572007-03-30 14:27:56 -04002495 sizeof(struct btrfs_item) *
2496 (nritems - slot - 1));
Chris Masonbe0e5c02007-01-26 15:51:26 -05002497 }
Chris Mason5f39d392007-10-15 16:14:19 -04002498 btrfs_set_header_nritems(leaf, nritems - 1);
Chris Mason7518a232007-03-12 12:01:18 -04002499 nritems--;
Chris Mason5f39d392007-10-15 16:14:19 -04002500
Chris Mason74123bd2007-02-02 11:05:29 -05002501 /* delete the leaf if we've emptied it */
Chris Mason7518a232007-03-12 12:01:18 -04002502 if (nritems == 0) {
Chris Mason5f39d392007-10-15 16:14:19 -04002503 if (leaf == root->node) {
2504 btrfs_set_header_level(leaf, 0);
Chris Mason9a8dd152007-02-23 08:38:36 -05002505 } else {
Chris Mason7bb86312007-12-11 09:25:06 -05002506 u64 root_gen = btrfs_header_generation(path->nodes[1]);
Chris Mason5f39d392007-10-15 16:14:19 -04002507 clean_tree_block(trans, root, leaf);
2508 wait_on_tree_block_writeback(root, leaf);
Chris Masone089f052007-03-16 16:20:31 -04002509 wret = del_ptr(trans, root, path, 1, path->slots[1]);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002510 if (wret)
2511 ret = wret;
Chris Masone089f052007-03-16 16:20:31 -04002512 wret = btrfs_free_extent(trans, root,
Chris Mason7bb86312007-12-11 09:25:06 -05002513 leaf->start, leaf->len,
2514 btrfs_header_owner(path->nodes[1]),
2515 root_gen, 0, 0, 1);
Chris Mason0f70abe2007-02-28 16:46:22 -05002516 if (wret)
2517 ret = wret;
Chris Mason9a8dd152007-02-23 08:38:36 -05002518 }
Chris Masonbe0e5c02007-01-26 15:51:26 -05002519 } else {
Chris Mason7518a232007-03-12 12:01:18 -04002520 int used = leaf_space_used(leaf, 0, nritems);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002521 if (slot == 0) {
Chris Mason5f39d392007-10-15 16:14:19 -04002522 struct btrfs_disk_key disk_key;
2523
2524 btrfs_item_key(leaf, &disk_key, 0);
Chris Masone089f052007-03-16 16:20:31 -04002525 wret = fixup_low_keys(trans, root, path,
Chris Mason5f39d392007-10-15 16:14:19 -04002526 &disk_key, 1);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002527 if (wret)
2528 ret = wret;
2529 }
Chris Masonaa5d6be2007-02-28 16:35:06 -05002530
Chris Mason74123bd2007-02-02 11:05:29 -05002531 /* delete the leaf if it is mostly empty */
Chris Mason7936ca32007-10-19 09:22:41 -04002532 if (used < BTRFS_LEAF_DATA_SIZE(root) / 3) {
Chris Masonbe0e5c02007-01-26 15:51:26 -05002533 /* push_leaf_left fixes the path.
2534 * make sure the path still points to our leaf
2535 * for possible call to del_ptr below
2536 */
Chris Mason4920c9a2007-01-26 16:38:42 -05002537 slot = path->slots[1];
Chris Mason5f39d392007-10-15 16:14:19 -04002538 extent_buffer_get(leaf);
2539
Chris Mason34a38212007-11-07 13:31:03 -05002540 wret = push_leaf_right(trans, root, path, 1, 1);
Chris Mason54aa1f42007-06-22 14:16:25 -04002541 if (wret < 0 && wret != -ENOSPC)
Chris Masonaa5d6be2007-02-28 16:35:06 -05002542 ret = wret;
Chris Mason5f39d392007-10-15 16:14:19 -04002543
2544 if (path->nodes[0] == leaf &&
2545 btrfs_header_nritems(leaf)) {
Chris Mason34a38212007-11-07 13:31:03 -05002546 wret = push_leaf_left(trans, root, path, 1, 1);
Chris Mason54aa1f42007-06-22 14:16:25 -04002547 if (wret < 0 && wret != -ENOSPC)
Chris Masonaa5d6be2007-02-28 16:35:06 -05002548 ret = wret;
2549 }
Chris Mason5f39d392007-10-15 16:14:19 -04002550
2551 if (btrfs_header_nritems(leaf) == 0) {
Chris Mason7bb86312007-12-11 09:25:06 -05002552 u64 root_gen;
Chris Masondb945352007-10-15 16:15:53 -04002553 u64 bytenr = leaf->start;
2554 u32 blocksize = leaf->len;
Chris Mason5f39d392007-10-15 16:14:19 -04002555
Chris Mason7bb86312007-12-11 09:25:06 -05002556 root_gen = btrfs_header_generation(
2557 path->nodes[1]);
2558
Chris Mason5f39d392007-10-15 16:14:19 -04002559 clean_tree_block(trans, root, leaf);
2560 wait_on_tree_block_writeback(root, leaf);
2561
Chris Masone089f052007-03-16 16:20:31 -04002562 wret = del_ptr(trans, root, path, 1, slot);
Chris Masonaa5d6be2007-02-28 16:35:06 -05002563 if (wret)
2564 ret = wret;
Chris Mason5f39d392007-10-15 16:14:19 -04002565
2566 free_extent_buffer(leaf);
Chris Masondb945352007-10-15 16:15:53 -04002567 wret = btrfs_free_extent(trans, root, bytenr,
Chris Mason7bb86312007-12-11 09:25:06 -05002568 blocksize,
2569 btrfs_header_owner(path->nodes[1]),
2570 root_gen, 0, 0, 1);
Chris Mason0f70abe2007-02-28 16:46:22 -05002571 if (wret)
2572 ret = wret;
Chris Mason5de08d72007-02-24 06:24:44 -05002573 } else {
Chris Mason5f39d392007-10-15 16:14:19 -04002574 btrfs_mark_buffer_dirty(leaf);
2575 free_extent_buffer(leaf);
Chris Masonbe0e5c02007-01-26 15:51:26 -05002576 }
Chris Masond5719762007-03-23 10:01:08 -04002577 } else {
Chris Mason5f39d392007-10-15 16:14:19 -04002578 btrfs_mark_buffer_dirty(leaf);
Chris Masonbe0e5c02007-01-26 15:51:26 -05002579 }
2580 }
Chris Masonaa5d6be2007-02-28 16:35:06 -05002581 return ret;
Chris Masonbe0e5c02007-01-26 15:51:26 -05002582}
2583
Chris Mason97571fd2007-02-24 13:39:08 -05002584/*
Chris Mason7bb86312007-12-11 09:25:06 -05002585 * walk up the tree as far as required to find the previous leaf.
2586 * returns 0 if it found something or 1 if there are no lesser leaves.
2587 * returns < 0 on io errors.
2588 */
2589int btrfs_prev_leaf(struct btrfs_root *root, struct btrfs_path *path)
2590{
2591 int slot;
2592 int level = 1;
2593 u64 bytenr;
2594 struct extent_buffer *c;
2595 struct extent_buffer *next = NULL;
2596
2597 while(level < BTRFS_MAX_LEVEL) {
2598 if (!path->nodes[level])
2599 return 1;
2600
2601 slot = path->slots[level];
2602 c = path->nodes[level];
2603 if (slot == 0) {
2604 level++;
2605 if (level == BTRFS_MAX_LEVEL)
2606 return 1;
2607 continue;
2608 }
2609 slot--;
2610
2611 bytenr = btrfs_node_blockptr(c, slot);
2612 if (next)
2613 free_extent_buffer(next);
2614
2615 if (path->reada < 0)
2616 reada_for_search(root, path, level, slot);
2617
2618 next = read_tree_block(root, bytenr,
2619 btrfs_level_size(root, level - 1));
2620 break;
2621 }
2622 path->slots[level] = slot;
2623 while(1) {
2624 level--;
2625 c = path->nodes[level];
2626 free_extent_buffer(c);
2627 path->nodes[level] = next;
2628 path->slots[level] = 0;
2629 if (!level)
2630 break;
2631 if (path->reada)
2632 reada_for_search(root, path, level, 0);
2633 next = read_tree_block(root, btrfs_node_blockptr(next, 0),
2634 btrfs_level_size(root, level - 1));
2635 }
2636 return 0;
2637}
2638
2639/*
Chris Mason97571fd2007-02-24 13:39:08 -05002640 * walk up the tree as far as required to find the next leaf.
Chris Mason0f70abe2007-02-28 16:46:22 -05002641 * returns 0 if it found something or 1 if there are no greater leaves.
2642 * returns < 0 on io errors.
Chris Mason97571fd2007-02-24 13:39:08 -05002643 */
Chris Mason234b63a2007-03-13 10:46:10 -04002644int btrfs_next_leaf(struct btrfs_root *root, struct btrfs_path *path)
Chris Masond97e63b2007-02-20 16:40:44 -05002645{
2646 int slot;
2647 int level = 1;
Chris Masondb945352007-10-15 16:15:53 -04002648 u64 bytenr;
Chris Mason5f39d392007-10-15 16:14:19 -04002649 struct extent_buffer *c;
2650 struct extent_buffer *next = NULL;
Chris Masond97e63b2007-02-20 16:40:44 -05002651
Chris Mason234b63a2007-03-13 10:46:10 -04002652 while(level < BTRFS_MAX_LEVEL) {
Chris Masond97e63b2007-02-20 16:40:44 -05002653 if (!path->nodes[level])
Chris Mason0f70abe2007-02-28 16:46:22 -05002654 return 1;
Chris Mason5f39d392007-10-15 16:14:19 -04002655
Chris Masond97e63b2007-02-20 16:40:44 -05002656 slot = path->slots[level] + 1;
2657 c = path->nodes[level];
Chris Mason5f39d392007-10-15 16:14:19 -04002658 if (slot >= btrfs_header_nritems(c)) {
Chris Masond97e63b2007-02-20 16:40:44 -05002659 level++;
Chris Mason7bb86312007-12-11 09:25:06 -05002660 if (level == BTRFS_MAX_LEVEL)
2661 return 1;
Chris Masond97e63b2007-02-20 16:40:44 -05002662 continue;
2663 }
Chris Mason5f39d392007-10-15 16:14:19 -04002664
Chris Masondb945352007-10-15 16:15:53 -04002665 bytenr = btrfs_node_blockptr(c, slot);
Chris Masoncfaa7292007-02-21 17:04:57 -05002666 if (next)
Chris Mason5f39d392007-10-15 16:14:19 -04002667 free_extent_buffer(next);
2668
Chris Mason6702ed42007-08-07 16:15:09 -04002669 if (path->reada)
2670 reada_for_search(root, path, level, slot);
Chris Mason5f39d392007-10-15 16:14:19 -04002671
Chris Masondb945352007-10-15 16:15:53 -04002672 next = read_tree_block(root, bytenr,
2673 btrfs_level_size(root, level -1));
Chris Masond97e63b2007-02-20 16:40:44 -05002674 break;
2675 }
2676 path->slots[level] = slot;
2677 while(1) {
2678 level--;
2679 c = path->nodes[level];
Chris Mason5f39d392007-10-15 16:14:19 -04002680 free_extent_buffer(c);
Chris Masond97e63b2007-02-20 16:40:44 -05002681 path->nodes[level] = next;
2682 path->slots[level] = 0;
2683 if (!level)
2684 break;
Chris Mason6702ed42007-08-07 16:15:09 -04002685 if (path->reada)
Yan32020612007-08-27 15:17:54 -04002686 reada_for_search(root, path, level, 0);
Chris Masondb945352007-10-15 16:15:53 -04002687 next = read_tree_block(root, btrfs_node_blockptr(next, 0),
2688 btrfs_level_size(root, level - 1));
Chris Masond97e63b2007-02-20 16:40:44 -05002689 }
2690 return 0;
2691}