/*
 * Copyright (C) 2007 Oracle.  All rights reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public
 * License v2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public
 * License along with this program; if not, write to the
 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
 * Boston, MA 02111-1307, USA.
 */
18
19#include <linux/sched.h>
20#include "ctree.h"
21#include "disk-io.h"
22#include "print-tree.h"
23#include "transaction.h"
Chris Masone7a84562008-06-25 16:01:31 -040024#include "locking.h"
Chris Mason6702ed42007-08-07 16:15:09 -040025
Eric Sandeende78b512013-01-31 18:21:12 +000026/*
27 * Defrag all the leaves in a given btree.
28 * Read all the leaves and try to get key order to
Chris Masond352ac62008-09-29 15:18:18 -040029 * better reflect disk order
30 */
Chris Masond3977122009-01-05 21:25:51 -050031
Chris Mason6702ed42007-08-07 16:15:09 -040032int btrfs_defrag_leaves(struct btrfs_trans_handle *trans,
Eric Sandeende78b512013-01-31 18:21:12 +000033 struct btrfs_root *root)
Chris Mason6702ed42007-08-07 16:15:09 -040034{
35 struct btrfs_path *path = NULL;
Chris Masone7a84562008-06-25 16:01:31 -040036 struct btrfs_key key;
Chris Mason6702ed42007-08-07 16:15:09 -040037 int ret = 0;
38 int wret;
39 int level;
Chris Masone7a84562008-06-25 16:01:31 -040040 int next_key_ret = 0;
Chris Masone9d0b132007-08-10 14:06:19 -040041 u64 last_ret = 0;
Chris Mason3f157a22008-06-25 16:01:31 -040042
Chris Masone7a84562008-06-25 16:01:31 -040043 if (root->fs_info->extent_root == root) {
Chris Mason1b1e2132008-06-25 16:01:31 -040044 /*
45 * there's recursion here right now in the tree locking,
46 * we can't defrag the extent root without deadlock
47 */
48 goto out;
Chris Masone7a84562008-06-25 16:01:31 -040049 }
Chris Mason925baed2008-06-25 16:01:30 -040050
Miao Xie27cdeb72014-04-02 19:51:05 +080051 if (!test_bit(BTRFS_ROOT_REF_COWS, &root->state))
Chris Mason6702ed42007-08-07 16:15:09 -040052 goto out;
Chris Mason5f39d392007-10-15 16:14:19 -040053
Chris Mason6702ed42007-08-07 16:15:09 -040054 path = btrfs_alloc_path();
55 if (!path)
56 return -ENOMEM;
57
Chris Mason5f39d392007-10-15 16:14:19 -040058 level = btrfs_header_level(root->node);
Chris Mason0f1ebbd2007-10-15 16:19:46 -040059
Chris Masond3977122009-01-05 21:25:51 -050060 if (level == 0)
Chris Mason6702ed42007-08-07 16:15:09 -040061 goto out;
Chris Masond3977122009-01-05 21:25:51 -050062
Chris Mason6702ed42007-08-07 16:15:09 -040063 if (root->defrag_progress.objectid == 0) {
Chris Masone7a84562008-06-25 16:01:31 -040064 struct extent_buffer *root_node;
Chris Mason0ef3e662008-05-24 14:04:53 -040065 u32 nritems;
66
Chris Masone7a84562008-06-25 16:01:31 -040067 root_node = btrfs_lock_root_node(root);
Chris Masonb4ce94d2009-02-04 09:25:08 -050068 btrfs_set_lock_blocking(root_node);
Chris Masone7a84562008-06-25 16:01:31 -040069 nritems = btrfs_header_nritems(root_node);
Chris Mason0ef3e662008-05-24 14:04:53 -040070 root->defrag_max.objectid = 0;
71 /* from above we know this is not a leaf */
Chris Masone7a84562008-06-25 16:01:31 -040072 btrfs_node_key_to_cpu(root_node, &root->defrag_max,
Chris Mason0ef3e662008-05-24 14:04:53 -040073 nritems - 1);
Chris Masone7a84562008-06-25 16:01:31 -040074 btrfs_tree_unlock(root_node);
75 free_extent_buffer(root_node);
76 memset(&key, 0, sizeof(key));
Chris Mason6702ed42007-08-07 16:15:09 -040077 } else {
Chris Masone7a84562008-06-25 16:01:31 -040078 memcpy(&key, &root->defrag_progress, sizeof(key));
Chris Mason6702ed42007-08-07 16:15:09 -040079 }
80
Chris Masone7a84562008-06-25 16:01:31 -040081 path->keep_locks = 1;
Chris Mason3f157a22008-06-25 16:01:31 -040082
Anand Jain7c829b72018-03-07 17:29:18 +080083 ret = btrfs_search_forward(root, &key, path, BTRFS_OLDEST_GENERATION);
Chris Mason3f157a22008-06-25 16:01:31 -040084 if (ret < 0)
85 goto out;
86 if (ret > 0) {
87 ret = 0;
88 goto out;
89 }
David Sterbab3b4aa72011-04-21 01:20:15 +020090 btrfs_release_path(path);
Filipe Manana03763742015-12-18 01:57:29 +000091 /*
92 * We don't need a lock on a leaf. btrfs_realloc_node() will lock all
93 * leafs from path->nodes[1], so set lowest_level to 1 to avoid later
94 * a deadlock (attempting to write lock an already write locked leaf).
95 */
96 path->lowest_level = 1;
Chris Masone7a84562008-06-25 16:01:31 -040097 wret = btrfs_search_slot(trans, root, &key, path, 0, 1);
Chris Mason6702ed42007-08-07 16:15:09 -040098
Chris Masone7a84562008-06-25 16:01:31 -040099 if (wret < 0) {
100 ret = wret;
101 goto out;
Chris Mason6702ed42007-08-07 16:15:09 -0400102 }
Chris Masone7a84562008-06-25 16:01:31 -0400103 if (!path->nodes[1]) {
104 ret = 0;
105 goto out;
106 }
Filipe Manana03763742015-12-18 01:57:29 +0000107 /*
108 * The node at level 1 must always be locked when our path has
109 * keep_locks set and lowest_level is 1, regardless of the value of
110 * path->slots[1].
111 */
112 BUG_ON(path->locks[1] == 0);
Chris Masone7a84562008-06-25 16:01:31 -0400113 ret = btrfs_realloc_node(trans, root,
114 path->nodes[1], 0,
Eric Sandeende78b512013-01-31 18:21:12 +0000115 &last_ret,
Chris Masone7a84562008-06-25 16:01:31 -0400116 &root->defrag_progress);
Yan, Zheng8929ecfa2010-05-16 10:49:58 -0400117 if (ret) {
118 WARN_ON(ret == -EAGAIN);
119 goto out;
120 }
Filipe Manana03763742015-12-18 01:57:29 +0000121 /*
122 * Now that we reallocated the node we can find the next key. Note that
123 * btrfs_find_next_key() can release our path and do another search
124 * without COWing, this is because even with path->keep_locks = 1,
125 * btrfs_search_slot() / ctree.c:unlock_up() does not keeps a lock on a
126 * node when path->slots[node_level - 1] does not point to the last
127 * item or a slot beyond the last item (ctree.c:unlock_up()). Therefore
128 * we search for the next key after reallocating our node.
129 */
130 path->slots[1] = btrfs_header_nritems(path->nodes[1]);
131 next_key_ret = btrfs_find_next_key(root, path, &key, 1,
Anand Jain7c829b72018-03-07 17:29:18 +0800132 BTRFS_OLDEST_GENERATION);
Chris Masone7a84562008-06-25 16:01:31 -0400133 if (next_key_ret == 0) {
134 memcpy(&root->defrag_progress, &key, sizeof(key));
135 ret = -EAGAIN;
136 }
Chris Mason6702ed42007-08-07 16:15:09 -0400137out:
Tsutomu Itoh527afb42015-08-19 14:55:00 +0900138 btrfs_free_path(path);
Chris Mason0ef3e662008-05-24 14:04:53 -0400139 if (ret == -EAGAIN) {
140 if (root->defrag_max.objectid > root->defrag_progress.objectid)
141 goto done;
142 if (root->defrag_max.type > root->defrag_progress.type)
143 goto done;
144 if (root->defrag_max.offset > root->defrag_progress.offset)
145 goto done;
146 ret = 0;
147 }
148done:
Chris Mason6702ed42007-08-07 16:15:09 -0400149 if (ret != -EAGAIN) {
150 memset(&root->defrag_progress, 0,
151 sizeof(root->defrag_progress));
Chris Mason3f157a22008-06-25 16:01:31 -0400152 root->defrag_trans_start = trans->transid;
Chris Mason6702ed42007-08-07 16:15:09 -0400153 }
154 return ret;
155}