Merge tag 'for_linus' of git://git.kernel.org/pub/scm/linux/kernel/git/mst/vhost
[cris-mirror.git] / fs / btrfs / tree-defrag.c
blobcb65089127cc7fc4af7847ff3282bc1bdc125bce
1 /*
2 * Copyright (C) 2007 Oracle. All rights reserved.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public
6 * License v2 as published by the Free Software Foundation.
8 * This program is distributed in the hope that it will be useful,
9 * but WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
13 * You should have received a copy of the GNU General Public
14 * License along with this program; if not, write to the
15 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
16 * Boston, MA 02111-1307, USA.
19 #include <linux/sched.h>
20 #include "ctree.h"
21 #include "disk-io.h"
22 #include "print-tree.h"
23 #include "transaction.h"
24 #include "locking.h"
27 * Defrag all the leaves in a given btree.
28 * Read all the leaves and try to get key order to
29 * better reflect disk order
32 int btrfs_defrag_leaves(struct btrfs_trans_handle *trans,
33 struct btrfs_root *root)
35 struct btrfs_path *path = NULL;
36 struct btrfs_key key;
37 int ret = 0;
38 int wret;
39 int level;
40 int next_key_ret = 0;
41 u64 last_ret = 0;
42 u64 min_trans = 0;
44 if (root->fs_info->extent_root == root) {
46 * there's recursion here right now in the tree locking,
47 * we can't defrag the extent root without deadlock
49 goto out;
52 if (!test_bit(BTRFS_ROOT_REF_COWS, &root->state))
53 goto out;
55 path = btrfs_alloc_path();
56 if (!path)
57 return -ENOMEM;
59 level = btrfs_header_level(root->node);
61 if (level == 0)
62 goto out;
64 if (root->defrag_progress.objectid == 0) {
65 struct extent_buffer *root_node;
66 u32 nritems;
68 root_node = btrfs_lock_root_node(root);
69 btrfs_set_lock_blocking(root_node);
70 nritems = btrfs_header_nritems(root_node);
71 root->defrag_max.objectid = 0;
72 /* from above we know this is not a leaf */
73 btrfs_node_key_to_cpu(root_node, &root->defrag_max,
74 nritems - 1);
75 btrfs_tree_unlock(root_node);
76 free_extent_buffer(root_node);
77 memset(&key, 0, sizeof(key));
78 } else {
79 memcpy(&key, &root->defrag_progress, sizeof(key));
82 path->keep_locks = 1;
84 ret = btrfs_search_forward(root, &key, path, min_trans);
85 if (ret < 0)
86 goto out;
87 if (ret > 0) {
88 ret = 0;
89 goto out;
91 btrfs_release_path(path);
93 * We don't need a lock on a leaf. btrfs_realloc_node() will lock all
94 * leafs from path->nodes[1], so set lowest_level to 1 to avoid later
95 * a deadlock (attempting to write lock an already write locked leaf).
97 path->lowest_level = 1;
98 wret = btrfs_search_slot(trans, root, &key, path, 0, 1);
100 if (wret < 0) {
101 ret = wret;
102 goto out;
104 if (!path->nodes[1]) {
105 ret = 0;
106 goto out;
109 * The node at level 1 must always be locked when our path has
110 * keep_locks set and lowest_level is 1, regardless of the value of
111 * path->slots[1].
113 BUG_ON(path->locks[1] == 0);
114 ret = btrfs_realloc_node(trans, root,
115 path->nodes[1], 0,
116 &last_ret,
117 &root->defrag_progress);
118 if (ret) {
119 WARN_ON(ret == -EAGAIN);
120 goto out;
123 * Now that we reallocated the node we can find the next key. Note that
124 * btrfs_find_next_key() can release our path and do another search
125 * without COWing, this is because even with path->keep_locks = 1,
126 * btrfs_search_slot() / ctree.c:unlock_up() does not keeps a lock on a
127 * node when path->slots[node_level - 1] does not point to the last
128 * item or a slot beyond the last item (ctree.c:unlock_up()). Therefore
129 * we search for the next key after reallocating our node.
131 path->slots[1] = btrfs_header_nritems(path->nodes[1]);
132 next_key_ret = btrfs_find_next_key(root, path, &key, 1,
133 min_trans);
134 if (next_key_ret == 0) {
135 memcpy(&root->defrag_progress, &key, sizeof(key));
136 ret = -EAGAIN;
138 out:
139 btrfs_free_path(path);
140 if (ret == -EAGAIN) {
141 if (root->defrag_max.objectid > root->defrag_progress.objectid)
142 goto done;
143 if (root->defrag_max.type > root->defrag_progress.type)
144 goto done;
145 if (root->defrag_max.offset > root->defrag_progress.offset)
146 goto done;
147 ret = 0;
149 done:
150 if (ret != -EAGAIN) {
151 memset(&root->defrag_progress, 0,
152 sizeof(root->defrag_progress));
153 root->defrag_trans_start = trans->transid;
155 return ret;