Commit | Line | Data |
---|---|---|
6cbd5570 CM |
1 | /* |
2 | * Copyright (C) 2007 Oracle. All rights reserved. | |
3 | * | |
4 | * This program is free software; you can redistribute it and/or | |
5 | * modify it under the terms of the GNU General Public | |
6 | * License v2 as published by the Free Software Foundation. | |
7 | * | |
8 | * This program is distributed in the hope that it will be useful, | |
9 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
11 | * General Public License for more details. | |
12 | * | |
13 | * You should have received a copy of the GNU General Public | |
14 | * License along with this program; if not, write to the | |
15 | * Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
16 | * Boston, MA 02111-1307, USA. | |
17 | */ | |
18 | ||
2e635a27 | 19 | #include <linux/module.h> |
fec577fb CM |
20 | #include "ctree.h" |
21 | #include "disk-io.h" | |
22 | #include "print-tree.h" | |
e089f05c | 23 | #include "transaction.h" |
fec577fb | 24 | |
e089f05c | 25 | static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root |
fbdc762b CM |
26 | *orig_root, u64 num_blocks, u64 search_start, |
27 | u64 search_end, u64 hint_block, | |
f2654de4 CM |
28 | struct btrfs_key *ins, u64 exclude_start, |
29 | u64 exclude_nr, int data); | |
e089f05c CM |
30 | static int finish_current_insert(struct btrfs_trans_handle *trans, struct |
31 | btrfs_root *extent_root); | |
e20d96d6 CM |
32 | static int del_pending_extents(struct btrfs_trans_handle *trans, struct |
33 | btrfs_root *extent_root); | |
fec577fb | 34 | |
de428b63 CM |
35 | static void reada_extent_leaves(struct btrfs_root *root, |
36 | struct btrfs_path *path, u64 limit) | |
37 | { | |
38 | struct btrfs_node *node; | |
39 | int i; | |
40 | int nritems; | |
41 | u64 item_objectid; | |
42 | u64 blocknr; | |
43 | int slot; | |
44 | int ret; | |
45 | ||
46 | if (!path->nodes[1]) | |
47 | return; | |
48 | node = btrfs_buffer_node(path->nodes[1]); | |
49 | slot = path->slots[1] + 1; | |
50 | nritems = btrfs_header_nritems(&node->header); | |
51 | for (i = slot; i < nritems && i < slot + 8; i++) { | |
52 | item_objectid = btrfs_disk_key_objectid(&node->ptrs[i].key); | |
53 | if (item_objectid > limit) | |
54 | break; | |
55 | blocknr = btrfs_node_blockptr(node, i); | |
56 | ret = readahead_tree_block(root, blocknr); | |
57 | if (ret) | |
58 | break; | |
59 | } | |
60 | } | |
61 | ||
e37c9e69 CM |
62 | static int cache_block_group(struct btrfs_root *root, |
63 | struct btrfs_block_group_cache *block_group) | |
64 | { | |
65 | struct btrfs_path *path; | |
66 | int ret; | |
67 | struct btrfs_key key; | |
68 | struct btrfs_leaf *leaf; | |
69 | struct radix_tree_root *extent_radix; | |
70 | int slot; | |
71 | u64 i; | |
72 | u64 last = 0; | |
73 | u64 hole_size; | |
de428b63 | 74 | u64 limit; |
e37c9e69 CM |
75 | int found = 0; |
76 | ||
77 | root = root->fs_info->extent_root; | |
78 | extent_radix = &root->fs_info->extent_map_radix; | |
79 | ||
80 | if (block_group->cached) | |
81 | return 0; | |
82 | if (block_group->data) | |
83 | return 0; | |
84 | path = btrfs_alloc_path(); | |
85 | if (!path) | |
86 | return -ENOMEM; | |
e37c9e69 CM |
87 | key.objectid = block_group->key.objectid; |
88 | key.flags = 0; | |
89 | key.offset = 0; | |
90 | btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY); | |
91 | ret = btrfs_search_slot(NULL, root, &key, path, 0, 0); | |
92 | if (ret < 0) | |
93 | return ret; | |
94 | if (ret && path->slots[0] > 0) | |
95 | path->slots[0]--; | |
de428b63 CM |
96 | limit = block_group->key.objectid + block_group->key.offset; |
97 | reada_extent_leaves(root, path, limit); | |
e37c9e69 CM |
98 | while(1) { |
99 | leaf = btrfs_buffer_leaf(path->nodes[0]); | |
100 | slot = path->slots[0]; | |
101 | if (slot >= btrfs_header_nritems(&leaf->header)) { | |
de428b63 | 102 | reada_extent_leaves(root, path, limit); |
e37c9e69 | 103 | ret = btrfs_next_leaf(root, path); |
54aa1f4d CM |
104 | if (ret < 0) |
105 | goto err; | |
de428b63 | 106 | if (ret == 0) { |
e37c9e69 | 107 | continue; |
de428b63 | 108 | } else { |
e37c9e69 CM |
109 | if (found) { |
110 | hole_size = block_group->key.objectid + | |
111 | block_group->key.offset - last; | |
112 | } else { | |
113 | last = block_group->key.objectid; | |
114 | hole_size = block_group->key.offset; | |
115 | } | |
116 | for (i = 0; i < hole_size; i++) { | |
117 | set_radix_bit(extent_radix, | |
118 | last + i); | |
119 | } | |
120 | break; | |
121 | } | |
122 | } | |
123 | btrfs_disk_key_to_cpu(&key, &leaf->items[slot].key); | |
124 | if (key.objectid >= block_group->key.objectid + | |
125 | block_group->key.offset) { | |
126 | if (found) { | |
127 | hole_size = block_group->key.objectid + | |
128 | block_group->key.offset - last; | |
129 | } else { | |
130 | last = block_group->key.objectid; | |
131 | hole_size = block_group->key.offset; | |
132 | } | |
133 | for (i = 0; i < hole_size; i++) { | |
134 | set_radix_bit(extent_radix, last + i); | |
135 | } | |
136 | break; | |
137 | } | |
138 | if (btrfs_key_type(&key) == BTRFS_EXTENT_ITEM_KEY) { | |
139 | if (!found) { | |
140 | last = key.objectid + key.offset; | |
141 | found = 1; | |
142 | } else { | |
143 | hole_size = key.objectid - last; | |
144 | for (i = 0; i < hole_size; i++) { | |
145 | set_radix_bit(extent_radix, last + i); | |
146 | } | |
147 | last = key.objectid + key.offset; | |
148 | } | |
149 | } | |
150 | path->slots[0]++; | |
151 | } | |
152 | ||
153 | block_group->cached = 1; | |
54aa1f4d | 154 | err: |
e37c9e69 CM |
155 | btrfs_free_path(path); |
156 | return 0; | |
157 | } | |
158 | ||
5276aeda CM |
159 | struct btrfs_block_group_cache *btrfs_lookup_block_group(struct |
160 | btrfs_fs_info *info, | |
161 | u64 blocknr) | |
be744175 CM |
162 | { |
163 | struct btrfs_block_group_cache *block_group; | |
164 | int ret; | |
165 | ||
166 | ret = radix_tree_gang_lookup(&info->block_group_radix, | |
167 | (void **)&block_group, | |
168 | blocknr, 1); | |
169 | if (ret) { | |
3e1ad54f | 170 | if (block_group->key.objectid <= blocknr && blocknr <= |
be744175 CM |
171 | block_group->key.objectid + block_group->key.offset) |
172 | return block_group; | |
173 | } | |
174 | ret = radix_tree_gang_lookup(&info->block_group_data_radix, | |
175 | (void **)&block_group, | |
176 | blocknr, 1); | |
177 | if (ret) { | |
3e1ad54f | 178 | if (block_group->key.objectid <= blocknr && blocknr <= |
be744175 CM |
179 | block_group->key.objectid + block_group->key.offset) |
180 | return block_group; | |
181 | } | |
be744175 CM |
182 | return NULL; |
183 | } | |
184 | ||
e37c9e69 CM |
185 | static u64 leaf_range(struct btrfs_root *root) |
186 | { | |
187 | u64 size = BTRFS_LEAF_DATA_SIZE(root); | |
84f54cfa CM |
188 | do_div(size, sizeof(struct btrfs_extent_item) + |
189 | sizeof(struct btrfs_item)); | |
e37c9e69 CM |
190 | return size; |
191 | } | |
192 | ||
193 | static u64 find_search_start(struct btrfs_root *root, | |
194 | struct btrfs_block_group_cache **cache_ret, | |
195 | u64 search_start, int num) | |
196 | { | |
197 | unsigned long gang[8]; | |
198 | int ret; | |
199 | struct btrfs_block_group_cache *cache = *cache_ret; | |
200 | u64 last = max(search_start, cache->key.objectid); | |
201 | ||
202 | if (cache->data) | |
203 | goto out; | |
204 | if (num > 1) { | |
205 | last = max(last, cache->last_prealloc); | |
206 | } | |
207 | again: | |
54aa1f4d CM |
208 | ret = cache_block_group(root, cache); |
209 | if (ret) | |
210 | goto out; | |
e37c9e69 CM |
211 | while(1) { |
212 | ret = find_first_radix_bit(&root->fs_info->extent_map_radix, | |
213 | gang, last, ARRAY_SIZE(gang)); | |
214 | if (!ret) | |
215 | goto out; | |
216 | last = gang[ret-1] + 1; | |
217 | if (num > 1) { | |
218 | if (ret != ARRAY_SIZE(gang)) { | |
219 | goto new_group; | |
220 | } | |
221 | if (gang[ret-1] - gang[0] > leaf_range(root)) { | |
222 | continue; | |
223 | } | |
224 | } | |
225 | if (gang[0] >= cache->key.objectid + cache->key.offset) { | |
226 | goto new_group; | |
227 | } | |
228 | return gang[0]; | |
229 | } | |
230 | out: | |
231 | return max(cache->last_alloc, search_start); | |
232 | ||
233 | new_group: | |
5276aeda CM |
234 | cache = btrfs_lookup_block_group(root->fs_info, |
235 | last + cache->key.offset - 1); | |
e37c9e69 CM |
236 | if (!cache) { |
237 | return max((*cache_ret)->last_alloc, search_start); | |
238 | } | |
239 | cache = btrfs_find_block_group(root, cache, | |
de428b63 | 240 | last + cache->key.offset - 1, 0, 0); |
e37c9e69 CM |
241 | *cache_ret = cache; |
242 | goto again; | |
243 | } | |
244 | ||
84f54cfa CM |
245 | static u64 div_factor(u64 num, int factor) |
246 | { | |
247 | num *= factor; | |
248 | do_div(num, 10); | |
249 | return num; | |
250 | } | |
251 | ||
31f3c99b CM |
252 | struct btrfs_block_group_cache *btrfs_find_block_group(struct btrfs_root *root, |
253 | struct btrfs_block_group_cache | |
be744175 | 254 | *hint, u64 search_start, |
de428b63 | 255 | int data, int owner) |
cd1bc465 CM |
256 | { |
257 | struct btrfs_block_group_cache *cache[8]; | |
31f3c99b | 258 | struct btrfs_block_group_cache *found_group = NULL; |
cd1bc465 | 259 | struct btrfs_fs_info *info = root->fs_info; |
be744175 | 260 | struct radix_tree_root *radix; |
1e2677e0 | 261 | struct radix_tree_root *swap_radix; |
cd1bc465 | 262 | u64 used; |
31f3c99b CM |
263 | u64 last = 0; |
264 | u64 hint_last; | |
cd1bc465 CM |
265 | int i; |
266 | int ret; | |
31f3c99b | 267 | int full_search = 0; |
de428b63 | 268 | int factor = 8; |
1e2677e0 | 269 | int data_swap = 0; |
de428b63 CM |
270 | |
271 | if (!owner) | |
272 | factor = 5; | |
be744175 | 273 | |
1e2677e0 | 274 | if (data) { |
be744175 | 275 | radix = &info->block_group_data_radix; |
1e2677e0 CM |
276 | swap_radix = &info->block_group_radix; |
277 | } else { | |
be744175 | 278 | radix = &info->block_group_radix; |
1e2677e0 CM |
279 | swap_radix = &info->block_group_data_radix; |
280 | } | |
be744175 CM |
281 | |
282 | if (search_start) { | |
283 | struct btrfs_block_group_cache *shint; | |
5276aeda | 284 | shint = btrfs_lookup_block_group(info, search_start); |
be744175 CM |
285 | if (shint->data == data) { |
286 | used = btrfs_block_group_used(&shint->item); | |
287 | if (used + shint->pinned < | |
84f54cfa | 288 | div_factor(shint->key.offset, factor)) { |
be744175 CM |
289 | return shint; |
290 | } | |
291 | } | |
292 | } | |
293 | if (hint && hint->data == data) { | |
31f3c99b | 294 | used = btrfs_block_group_used(&hint->item); |
84f54cfa CM |
295 | if (used + hint->pinned < |
296 | div_factor(hint->key.offset, factor)) { | |
31f3c99b CM |
297 | return hint; |
298 | } | |
84f54cfa | 299 | if (used >= div_factor(hint->key.offset, 8)) { |
be744175 CM |
300 | radix_tree_tag_clear(radix, |
301 | hint->key.objectid + | |
302 | hint->key.offset - 1, | |
303 | BTRFS_BLOCK_GROUP_AVAIL); | |
304 | } | |
8d7be552 | 305 | last = hint->key.offset * 3; |
be744175 | 306 | if (hint->key.objectid >= last) |
e37c9e69 CM |
307 | last = max(search_start + hint->key.offset - 1, |
308 | hint->key.objectid - last); | |
be744175 CM |
309 | else |
310 | last = hint->key.objectid + hint->key.offset; | |
31f3c99b CM |
311 | hint_last = last; |
312 | } else { | |
e37c9e69 CM |
313 | if (hint) |
314 | hint_last = max(hint->key.objectid, search_start); | |
315 | else | |
316 | hint_last = search_start; | |
317 | ||
318 | last = hint_last; | |
31f3c99b | 319 | } |
cd1bc465 | 320 | while(1) { |
be744175 | 321 | ret = radix_tree_gang_lookup_tag(radix, (void **)cache, |
cd1bc465 | 322 | last, ARRAY_SIZE(cache), |
31f3c99b | 323 | BTRFS_BLOCK_GROUP_AVAIL); |
cd1bc465 CM |
324 | if (!ret) |
325 | break; | |
326 | for (i = 0; i < ret; i++) { | |
be08c1b9 CM |
327 | last = cache[i]->key.objectid + |
328 | cache[i]->key.offset; | |
cd1bc465 | 329 | used = btrfs_block_group_used(&cache[i]->item); |
be744175 | 330 | if (used + cache[i]->pinned < |
84f54cfa | 331 | div_factor(cache[i]->key.offset, factor)) { |
31f3c99b CM |
332 | found_group = cache[i]; |
333 | goto found; | |
cd1bc465 | 334 | } |
84f54cfa | 335 | if (used >= div_factor(cache[i]->key.offset, 8)) { |
be744175 CM |
336 | radix_tree_tag_clear(radix, |
337 | cache[i]->key.objectid + | |
338 | cache[i]->key.offset - 1, | |
339 | BTRFS_BLOCK_GROUP_AVAIL); | |
340 | } | |
cd1bc465 | 341 | } |
de428b63 | 342 | cond_resched(); |
cd1bc465 | 343 | } |
31f3c99b CM |
344 | last = hint_last; |
345 | again: | |
cd1bc465 | 346 | while(1) { |
be744175 CM |
347 | ret = radix_tree_gang_lookup(radix, (void **)cache, |
348 | last, ARRAY_SIZE(cache)); | |
cd1bc465 CM |
349 | if (!ret) |
350 | break; | |
351 | for (i = 0; i < ret; i++) { | |
be08c1b9 CM |
352 | last = cache[i]->key.objectid + |
353 | cache[i]->key.offset; | |
cd1bc465 | 354 | used = btrfs_block_group_used(&cache[i]->item); |
be744175 | 355 | if (used + cache[i]->pinned < cache[i]->key.offset) { |
31f3c99b CM |
356 | found_group = cache[i]; |
357 | goto found; | |
cd1bc465 | 358 | } |
be744175 CM |
359 | if (used >= cache[i]->key.offset) { |
360 | radix_tree_tag_clear(radix, | |
361 | cache[i]->key.objectid + | |
362 | cache[i]->key.offset - 1, | |
363 | BTRFS_BLOCK_GROUP_AVAIL); | |
364 | } | |
cd1bc465 | 365 | } |
de428b63 | 366 | cond_resched(); |
cd1bc465 | 367 | } |
31f3c99b | 368 | if (!full_search) { |
be744175 | 369 | last = search_start; |
31f3c99b CM |
370 | full_search = 1; |
371 | goto again; | |
372 | } | |
1e2677e0 CM |
373 | if (!data_swap) { |
374 | struct radix_tree_root *tmp = radix; | |
375 | data_swap = 1; | |
376 | radix = swap_radix; | |
377 | swap_radix = tmp; | |
378 | last = search_start; | |
379 | goto again; | |
380 | } | |
31f3c99b | 381 | if (!found_group) { |
be744175 | 382 | ret = radix_tree_gang_lookup(radix, |
31f3c99b | 383 | (void **)&found_group, 0, 1); |
1e2677e0 CM |
384 | if (ret == 0) { |
385 | ret = radix_tree_gang_lookup(swap_radix, | |
386 | (void **)&found_group, | |
387 | 0, 1); | |
388 | } | |
31f3c99b CM |
389 | BUG_ON(ret != 1); |
390 | } | |
be744175 | 391 | found: |
31f3c99b | 392 | return found_group; |
cd1bc465 CM |
393 | } |
394 | ||
b18c6685 CM |
395 | int btrfs_inc_extent_ref(struct btrfs_trans_handle *trans, |
396 | struct btrfs_root *root, | |
397 | u64 blocknr, u64 num_blocks) | |
02217ed2 | 398 | { |
5caf2a00 | 399 | struct btrfs_path *path; |
02217ed2 | 400 | int ret; |
e2fa7227 | 401 | struct btrfs_key key; |
234b63a0 CM |
402 | struct btrfs_leaf *l; |
403 | struct btrfs_extent_item *item; | |
e2fa7227 | 404 | struct btrfs_key ins; |
cf27e1ee | 405 | u32 refs; |
037e6390 | 406 | |
5caf2a00 | 407 | path = btrfs_alloc_path(); |
54aa1f4d CM |
408 | if (!path) |
409 | return -ENOMEM; | |
410 | ret = find_free_extent(trans, root->fs_info->extent_root, 0, 0, | |
f2654de4 | 411 | (u64)-1, 0, &ins, 0, 0, 0); |
54aa1f4d CM |
412 | if (ret) { |
413 | btrfs_free_path(path); | |
414 | return ret; | |
415 | } | |
02217ed2 CM |
416 | key.objectid = blocknr; |
417 | key.flags = 0; | |
62e2749e | 418 | btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY); |
6407bf6d | 419 | key.offset = num_blocks; |
5caf2a00 | 420 | ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, path, |
9f5fae2f | 421 | 0, 1); |
54aa1f4d CM |
422 | if (ret < 0) |
423 | return ret; | |
a429e513 | 424 | if (ret != 0) { |
a28ec197 | 425 | BUG(); |
a429e513 | 426 | } |
02217ed2 | 427 | BUG_ON(ret != 0); |
5caf2a00 CM |
428 | l = btrfs_buffer_leaf(path->nodes[0]); |
429 | item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item); | |
cf27e1ee CM |
430 | refs = btrfs_extent_refs(item); |
431 | btrfs_set_extent_refs(item, refs + 1); | |
5caf2a00 | 432 | btrfs_mark_buffer_dirty(path->nodes[0]); |
a28ec197 | 433 | |
5caf2a00 CM |
434 | btrfs_release_path(root->fs_info->extent_root, path); |
435 | btrfs_free_path(path); | |
9f5fae2f | 436 | finish_current_insert(trans, root->fs_info->extent_root); |
e20d96d6 | 437 | del_pending_extents(trans, root->fs_info->extent_root); |
02217ed2 CM |
438 | return 0; |
439 | } | |
440 | ||
b18c6685 CM |
441 | static int lookup_extent_ref(struct btrfs_trans_handle *trans, |
442 | struct btrfs_root *root, u64 blocknr, | |
443 | u64 num_blocks, u32 *refs) | |
a28ec197 | 444 | { |
5caf2a00 | 445 | struct btrfs_path *path; |
a28ec197 | 446 | int ret; |
e2fa7227 | 447 | struct btrfs_key key; |
234b63a0 CM |
448 | struct btrfs_leaf *l; |
449 | struct btrfs_extent_item *item; | |
5caf2a00 CM |
450 | |
451 | path = btrfs_alloc_path(); | |
a28ec197 | 452 | key.objectid = blocknr; |
6407bf6d | 453 | key.offset = num_blocks; |
62e2749e CM |
454 | key.flags = 0; |
455 | btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY); | |
5caf2a00 | 456 | ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, path, |
9f5fae2f | 457 | 0, 0); |
54aa1f4d CM |
458 | if (ret < 0) |
459 | goto out; | |
a28ec197 CM |
460 | if (ret != 0) |
461 | BUG(); | |
5caf2a00 CM |
462 | l = btrfs_buffer_leaf(path->nodes[0]); |
463 | item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item); | |
cf27e1ee | 464 | *refs = btrfs_extent_refs(item); |
54aa1f4d | 465 | out: |
5caf2a00 | 466 | btrfs_free_path(path); |
a28ec197 CM |
467 | return 0; |
468 | } | |
469 | ||
c5739bba CM |
470 | int btrfs_inc_root_ref(struct btrfs_trans_handle *trans, |
471 | struct btrfs_root *root) | |
472 | { | |
b18c6685 | 473 | return btrfs_inc_extent_ref(trans, root, bh_blocknr(root->node), 1); |
c5739bba CM |
474 | } |
475 | ||
e089f05c | 476 | int btrfs_inc_ref(struct btrfs_trans_handle *trans, struct btrfs_root *root, |
e20d96d6 | 477 | struct buffer_head *buf) |
02217ed2 CM |
478 | { |
479 | u64 blocknr; | |
e20d96d6 | 480 | struct btrfs_node *buf_node; |
6407bf6d CM |
481 | struct btrfs_leaf *buf_leaf; |
482 | struct btrfs_disk_key *key; | |
483 | struct btrfs_file_extent_item *fi; | |
02217ed2 | 484 | int i; |
6407bf6d CM |
485 | int leaf; |
486 | int ret; | |
54aa1f4d CM |
487 | int faili; |
488 | int err; | |
a28ec197 | 489 | |
3768f368 | 490 | if (!root->ref_cows) |
a28ec197 | 491 | return 0; |
e20d96d6 | 492 | buf_node = btrfs_buffer_node(buf); |
6407bf6d CM |
493 | leaf = btrfs_is_leaf(buf_node); |
494 | buf_leaf = btrfs_buffer_leaf(buf); | |
e20d96d6 | 495 | for (i = 0; i < btrfs_header_nritems(&buf_node->header); i++) { |
6407bf6d | 496 | if (leaf) { |
3a686375 | 497 | u64 disk_blocknr; |
6407bf6d CM |
498 | key = &buf_leaf->items[i].key; |
499 | if (btrfs_disk_key_type(key) != BTRFS_EXTENT_DATA_KEY) | |
500 | continue; | |
501 | fi = btrfs_item_ptr(buf_leaf, i, | |
502 | struct btrfs_file_extent_item); | |
236454df CM |
503 | if (btrfs_file_extent_type(fi) == |
504 | BTRFS_FILE_EXTENT_INLINE) | |
505 | continue; | |
3a686375 CM |
506 | disk_blocknr = btrfs_file_extent_disk_blocknr(fi); |
507 | if (disk_blocknr == 0) | |
508 | continue; | |
509 | ret = btrfs_inc_extent_ref(trans, root, disk_blocknr, | |
6407bf6d | 510 | btrfs_file_extent_disk_num_blocks(fi)); |
54aa1f4d CM |
511 | if (ret) { |
512 | faili = i; | |
513 | goto fail; | |
514 | } | |
6407bf6d CM |
515 | } else { |
516 | blocknr = btrfs_node_blockptr(buf_node, i); | |
b18c6685 | 517 | ret = btrfs_inc_extent_ref(trans, root, blocknr, 1); |
54aa1f4d CM |
518 | if (ret) { |
519 | faili = i; | |
520 | goto fail; | |
521 | } | |
6407bf6d | 522 | } |
02217ed2 CM |
523 | } |
524 | return 0; | |
54aa1f4d | 525 | fail: |
ccd467d6 | 526 | WARN_ON(1); |
54aa1f4d CM |
527 | for (i =0; i < faili; i++) { |
528 | if (leaf) { | |
529 | u64 disk_blocknr; | |
530 | key = &buf_leaf->items[i].key; | |
531 | if (btrfs_disk_key_type(key) != BTRFS_EXTENT_DATA_KEY) | |
532 | continue; | |
533 | fi = btrfs_item_ptr(buf_leaf, i, | |
534 | struct btrfs_file_extent_item); | |
535 | if (btrfs_file_extent_type(fi) == | |
536 | BTRFS_FILE_EXTENT_INLINE) | |
537 | continue; | |
538 | disk_blocknr = btrfs_file_extent_disk_blocknr(fi); | |
539 | if (disk_blocknr == 0) | |
540 | continue; | |
541 | err = btrfs_free_extent(trans, root, disk_blocknr, | |
542 | btrfs_file_extent_disk_num_blocks(fi), 0); | |
543 | BUG_ON(err); | |
544 | } else { | |
545 | blocknr = btrfs_node_blockptr(buf_node, i); | |
546 | err = btrfs_free_extent(trans, root, blocknr, 1, 0); | |
547 | BUG_ON(err); | |
548 | } | |
549 | } | |
550 | return ret; | |
02217ed2 CM |
551 | } |
552 | ||
9078a3e1 CM |
553 | static int write_one_cache_group(struct btrfs_trans_handle *trans, |
554 | struct btrfs_root *root, | |
555 | struct btrfs_path *path, | |
556 | struct btrfs_block_group_cache *cache) | |
557 | { | |
558 | int ret; | |
559 | int pending_ret; | |
560 | struct btrfs_root *extent_root = root->fs_info->extent_root; | |
561 | struct btrfs_block_group_item *bi; | |
562 | struct btrfs_key ins; | |
563 | ||
f2654de4 CM |
564 | ret = find_free_extent(trans, extent_root, 0, 0, (u64)-1, 0, &ins, |
565 | 0, 0, 0); | |
54aa1f4d CM |
566 | /* FIXME, set bit to recalc cache groups on next mount */ |
567 | if (ret) | |
568 | return ret; | |
9078a3e1 | 569 | ret = btrfs_search_slot(trans, extent_root, &cache->key, path, 0, 1); |
54aa1f4d CM |
570 | if (ret < 0) |
571 | goto fail; | |
9078a3e1 CM |
572 | BUG_ON(ret); |
573 | bi = btrfs_item_ptr(btrfs_buffer_leaf(path->nodes[0]), path->slots[0], | |
574 | struct btrfs_block_group_item); | |
575 | memcpy(bi, &cache->item, sizeof(*bi)); | |
ccd467d6 | 576 | btrfs_mark_buffer_dirty(path->nodes[0]); |
9078a3e1 | 577 | btrfs_release_path(extent_root, path); |
54aa1f4d | 578 | fail: |
9078a3e1 CM |
579 | finish_current_insert(trans, extent_root); |
580 | pending_ret = del_pending_extents(trans, extent_root); | |
581 | if (ret) | |
582 | return ret; | |
583 | if (pending_ret) | |
584 | return pending_ret; | |
be744175 CM |
585 | if (cache->data) |
586 | cache->last_alloc = cache->first_free; | |
9078a3e1 CM |
587 | return 0; |
588 | ||
589 | } | |
590 | ||
be744175 CM |
591 | static int write_dirty_block_radix(struct btrfs_trans_handle *trans, |
592 | struct btrfs_root *root, | |
593 | struct radix_tree_root *radix) | |
9078a3e1 CM |
594 | { |
595 | struct btrfs_block_group_cache *cache[8]; | |
596 | int ret; | |
597 | int err = 0; | |
598 | int werr = 0; | |
9078a3e1 CM |
599 | int i; |
600 | struct btrfs_path *path; | |
54aa1f4d | 601 | unsigned long off = 0; |
9078a3e1 CM |
602 | |
603 | path = btrfs_alloc_path(); | |
604 | if (!path) | |
605 | return -ENOMEM; | |
606 | ||
607 | while(1) { | |
608 | ret = radix_tree_gang_lookup_tag(radix, (void **)cache, | |
54aa1f4d | 609 | off, ARRAY_SIZE(cache), |
9078a3e1 CM |
610 | BTRFS_BLOCK_GROUP_DIRTY); |
611 | if (!ret) | |
612 | break; | |
613 | for (i = 0; i < ret; i++) { | |
9078a3e1 CM |
614 | err = write_one_cache_group(trans, root, |
615 | path, cache[i]); | |
54aa1f4d CM |
616 | /* |
617 | * if we fail to write the cache group, we want | |
618 | * to keep it marked dirty in hopes that a later | |
619 | * write will work | |
620 | */ | |
621 | if (err) { | |
9078a3e1 | 622 | werr = err; |
54aa1f4d CM |
623 | off = cache[i]->key.objectid + |
624 | cache[i]->key.offset; | |
625 | continue; | |
626 | } | |
627 | ||
628 | radix_tree_tag_clear(radix, cache[i]->key.objectid + | |
629 | cache[i]->key.offset - 1, | |
630 | BTRFS_BLOCK_GROUP_DIRTY); | |
9078a3e1 CM |
631 | } |
632 | } | |
633 | btrfs_free_path(path); | |
634 | return werr; | |
635 | } | |
636 | ||
be744175 CM |
637 | int btrfs_write_dirty_block_groups(struct btrfs_trans_handle *trans, |
638 | struct btrfs_root *root) | |
639 | { | |
640 | int ret; | |
641 | int ret2; | |
642 | ret = write_dirty_block_radix(trans, root, | |
643 | &root->fs_info->block_group_radix); | |
644 | ret2 = write_dirty_block_radix(trans, root, | |
645 | &root->fs_info->block_group_data_radix); | |
646 | if (ret) | |
647 | return ret; | |
648 | if (ret2) | |
649 | return ret2; | |
650 | return 0; | |
651 | } | |
652 | ||
9078a3e1 CM |
653 | static int update_block_group(struct btrfs_trans_handle *trans, |
654 | struct btrfs_root *root, | |
1e2677e0 CM |
655 | u64 blocknr, u64 num, int alloc, int mark_free, |
656 | int data) | |
9078a3e1 CM |
657 | { |
658 | struct btrfs_block_group_cache *cache; | |
659 | struct btrfs_fs_info *info = root->fs_info; | |
660 | u64 total = num; | |
661 | u64 old_val; | |
662 | u64 block_in_group; | |
e37c9e69 | 663 | u64 i; |
1e2677e0 | 664 | int ret; |
3e1ad54f | 665 | |
9078a3e1 | 666 | while(total) { |
5276aeda | 667 | cache = btrfs_lookup_block_group(info, blocknr); |
3e1ad54f | 668 | if (!cache) { |
9078a3e1 | 669 | return -1; |
cd1bc465 | 670 | } |
9078a3e1 CM |
671 | block_in_group = blocknr - cache->key.objectid; |
672 | WARN_ON(block_in_group > cache->key.offset); | |
3e1ad54f | 673 | radix_tree_tag_set(cache->radix, cache->key.objectid + |
be744175 | 674 | cache->key.offset - 1, |
9078a3e1 CM |
675 | BTRFS_BLOCK_GROUP_DIRTY); |
676 | ||
677 | old_val = btrfs_block_group_used(&cache->item); | |
678 | num = min(total, cache->key.offset - block_in_group); | |
cd1bc465 | 679 | if (alloc) { |
cd1bc465 CM |
680 | if (blocknr > cache->last_alloc) |
681 | cache->last_alloc = blocknr; | |
e37c9e69 CM |
682 | if (!cache->data) { |
683 | for (i = 0; i < num; i++) { | |
684 | clear_radix_bit(&info->extent_map_radix, | |
685 | blocknr + i); | |
686 | } | |
687 | } | |
1e2677e0 | 688 | if (cache->data != data && |
84f54cfa | 689 | old_val < (cache->key.offset >> 1)) { |
1e2677e0 CM |
690 | cache->data = data; |
691 | radix_tree_delete(cache->radix, | |
692 | cache->key.objectid + | |
693 | cache->key.offset - 1); | |
694 | ||
695 | if (data) { | |
696 | cache->radix = | |
697 | &info->block_group_data_radix; | |
698 | cache->item.flags |= | |
699 | BTRFS_BLOCK_GROUP_DATA; | |
700 | } else { | |
701 | cache->radix = &info->block_group_radix; | |
702 | cache->item.flags &= | |
703 | ~BTRFS_BLOCK_GROUP_DATA; | |
704 | } | |
705 | ret = radix_tree_insert(cache->radix, | |
706 | cache->key.objectid + | |
707 | cache->key.offset - 1, | |
708 | (void *)cache); | |
709 | } | |
710 | old_val += num; | |
cd1bc465 | 711 | } else { |
9078a3e1 | 712 | old_val -= num; |
cd1bc465 CM |
713 | if (blocknr < cache->first_free) |
714 | cache->first_free = blocknr; | |
e37c9e69 CM |
715 | if (!cache->data && mark_free) { |
716 | for (i = 0; i < num; i++) { | |
717 | set_radix_bit(&info->extent_map_radix, | |
718 | blocknr + i); | |
719 | } | |
720 | } | |
84f54cfa CM |
721 | if (old_val < (cache->key.offset >> 1) && |
722 | old_val + num >= (cache->key.offset >> 1)) { | |
e37c9e69 CM |
723 | radix_tree_tag_set(cache->radix, |
724 | cache->key.objectid + | |
725 | cache->key.offset - 1, | |
726 | BTRFS_BLOCK_GROUP_AVAIL); | |
727 | } | |
cd1bc465 | 728 | } |
9078a3e1 | 729 | btrfs_set_block_group_used(&cache->item, old_val); |
e37c9e69 CM |
730 | total -= num; |
731 | blocknr += num; | |
9078a3e1 CM |
732 | } |
733 | return 0; | |
734 | } | |
735 | ||
be08c1b9 CM |
/*
 * Ask the page cache to drop the single page at @index of @mapping and
 * return whatever invalidate_mapping_pages() reports.
 */
static int try_remove_page(struct address_space *mapping, unsigned long index)
{
	return invalidate_mapping_pages(mapping, index, index);
}
742 | ||
ccd467d6 CM |
743 | int btrfs_copy_pinned(struct btrfs_root *root, struct radix_tree_root *copy) |
744 | { | |
745 | unsigned long gang[8]; | |
746 | u64 last = 0; | |
747 | struct radix_tree_root *pinned_radix = &root->fs_info->pinned_radix; | |
748 | int ret; | |
749 | int i; | |
750 | ||
751 | while(1) { | |
752 | ret = find_first_radix_bit(pinned_radix, gang, last, | |
753 | ARRAY_SIZE(gang)); | |
754 | if (!ret) | |
755 | break; | |
756 | for (i = 0 ; i < ret; i++) { | |
757 | set_radix_bit(copy, gang[i]); | |
758 | last = gang[i] + 1; | |
759 | } | |
760 | } | |
761 | return 0; | |
762 | } | |
763 | ||
764 | int btrfs_finish_extent_commit(struct btrfs_trans_handle *trans, | |
765 | struct btrfs_root *root, | |
766 | struct radix_tree_root *unpin_radix) | |
a28ec197 | 767 | { |
8ef97622 | 768 | unsigned long gang[8]; |
be08c1b9 | 769 | struct inode *btree_inode = root->fs_info->btree_inode; |
be744175 | 770 | struct btrfs_block_group_cache *block_group; |
88fd146c | 771 | u64 first = 0; |
a28ec197 CM |
772 | int ret; |
773 | int i; | |
8ef97622 | 774 | struct radix_tree_root *pinned_radix = &root->fs_info->pinned_radix; |
e37c9e69 | 775 | struct radix_tree_root *extent_radix = &root->fs_info->extent_map_radix; |
a28ec197 CM |
776 | |
777 | while(1) { | |
ccd467d6 | 778 | ret = find_first_radix_bit(unpin_radix, gang, 0, |
8ef97622 | 779 | ARRAY_SIZE(gang)); |
a28ec197 CM |
780 | if (!ret) |
781 | break; | |
88fd146c | 782 | if (!first) |
8ef97622 | 783 | first = gang[0]; |
0579da42 | 784 | for (i = 0; i < ret; i++) { |
8ef97622 | 785 | clear_radix_bit(pinned_radix, gang[i]); |
ccd467d6 | 786 | clear_radix_bit(unpin_radix, gang[i]); |
5276aeda CM |
787 | block_group = btrfs_lookup_block_group(root->fs_info, |
788 | gang[i]); | |
be744175 CM |
789 | if (block_group) { |
790 | WARN_ON(block_group->pinned == 0); | |
791 | block_group->pinned--; | |
792 | if (gang[i] < block_group->last_alloc) | |
793 | block_group->last_alloc = gang[i]; | |
e37c9e69 CM |
794 | if (gang[i] < block_group->last_prealloc) |
795 | block_group->last_prealloc = gang[i]; | |
796 | if (!block_group->data) | |
797 | set_radix_bit(extent_radix, gang[i]); | |
be744175 | 798 | } |
be08c1b9 CM |
799 | try_remove_page(btree_inode->i_mapping, |
800 | gang[i] << (PAGE_CACHE_SHIFT - | |
801 | btree_inode->i_blkbits)); | |
0579da42 | 802 | } |
a28ec197 CM |
803 | } |
804 | return 0; | |
805 | } | |
806 | ||
e089f05c CM |
807 | static int finish_current_insert(struct btrfs_trans_handle *trans, struct |
808 | btrfs_root *extent_root) | |
037e6390 | 809 | { |
e2fa7227 | 810 | struct btrfs_key ins; |
234b63a0 | 811 | struct btrfs_extent_item extent_item; |
037e6390 CM |
812 | int i; |
813 | int ret; | |
1261ec42 CM |
814 | u64 super_blocks_used; |
815 | struct btrfs_fs_info *info = extent_root->fs_info; | |
037e6390 | 816 | |
cf27e1ee | 817 | btrfs_set_extent_refs(&extent_item, 1); |
037e6390 CM |
818 | ins.offset = 1; |
819 | ins.flags = 0; | |
62e2749e | 820 | btrfs_set_key_type(&ins, BTRFS_EXTENT_ITEM_KEY); |
5d0c3e60 | 821 | btrfs_set_extent_owner(&extent_item, extent_root->root_key.objectid); |
037e6390 | 822 | |
f2458e1d CM |
823 | for (i = 0; i < extent_root->fs_info->extent_tree_insert_nr; i++) { |
824 | ins.objectid = extent_root->fs_info->extent_tree_insert[i]; | |
4b52dff6 CM |
825 | super_blocks_used = btrfs_super_blocks_used(&info->super_copy); |
826 | btrfs_set_super_blocks_used(&info->super_copy, | |
1261ec42 | 827 | super_blocks_used + 1); |
e089f05c CM |
828 | ret = btrfs_insert_item(trans, extent_root, &ins, &extent_item, |
829 | sizeof(extent_item)); | |
037e6390 CM |
830 | BUG_ON(ret); |
831 | } | |
f2458e1d | 832 | extent_root->fs_info->extent_tree_insert_nr = 0; |
037e6390 CM |
833 | return 0; |
834 | } | |
835 | ||
8ef97622 | 836 | static int pin_down_block(struct btrfs_root *root, u64 blocknr, int pending) |
e20d96d6 CM |
837 | { |
838 | int err; | |
78fae27e | 839 | struct btrfs_header *header; |
8ef97622 CM |
840 | struct buffer_head *bh; |
841 | ||
f4b9aa8d | 842 | if (!pending) { |
d98237b3 | 843 | bh = btrfs_find_tree_block(root, blocknr); |
2c90e5d6 CM |
844 | if (bh) { |
845 | if (buffer_uptodate(bh)) { | |
846 | u64 transid = | |
847 | root->fs_info->running_transaction->transid; | |
848 | header = btrfs_buffer_header(bh); | |
849 | if (btrfs_header_generation(header) == | |
850 | transid) { | |
851 | btrfs_block_release(root, bh); | |
852 | return 0; | |
853 | } | |
f4b9aa8d | 854 | } |
d6025579 | 855 | btrfs_block_release(root, bh); |
8ef97622 | 856 | } |
8ef97622 | 857 | err = set_radix_bit(&root->fs_info->pinned_radix, blocknr); |
be744175 CM |
858 | if (!err) { |
859 | struct btrfs_block_group_cache *cache; | |
5276aeda CM |
860 | cache = btrfs_lookup_block_group(root->fs_info, |
861 | blocknr); | |
be744175 CM |
862 | if (cache) |
863 | cache->pinned++; | |
864 | } | |
f4b9aa8d CM |
865 | } else { |
866 | err = set_radix_bit(&root->fs_info->pending_del_radix, blocknr); | |
867 | } | |
be744175 | 868 | BUG_ON(err < 0); |
e20d96d6 CM |
869 | return 0; |
870 | } | |
871 | ||
fec577fb | 872 | /* |
a28ec197 | 873 | * remove an extent from the root, returns 0 on success |
fec577fb | 874 | */ |
e089f05c | 875 | static int __free_extent(struct btrfs_trans_handle *trans, struct btrfs_root |
e37c9e69 CM |
876 | *root, u64 blocknr, u64 num_blocks, int pin, |
877 | int mark_free) | |
a28ec197 | 878 | { |
5caf2a00 | 879 | struct btrfs_path *path; |
e2fa7227 | 880 | struct btrfs_key key; |
1261ec42 CM |
881 | struct btrfs_fs_info *info = root->fs_info; |
882 | struct btrfs_root *extent_root = info->extent_root; | |
a28ec197 | 883 | int ret; |
234b63a0 | 884 | struct btrfs_extent_item *ei; |
e2fa7227 | 885 | struct btrfs_key ins; |
cf27e1ee | 886 | u32 refs; |
037e6390 | 887 | |
a28ec197 CM |
888 | key.objectid = blocknr; |
889 | key.flags = 0; | |
62e2749e | 890 | btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY); |
a28ec197 CM |
891 | key.offset = num_blocks; |
892 | ||
5caf2a00 | 893 | path = btrfs_alloc_path(); |
54aa1f4d CM |
894 | if (!path) |
895 | return -ENOMEM; | |
5f26f772 | 896 | |
f2654de4 | 897 | ret = find_free_extent(trans, root, 0, 0, (u64)-1, 0, &ins, 0, 0, 0); |
a28ec197 | 898 | if (ret) { |
54aa1f4d CM |
899 | btrfs_free_path(path); |
900 | return ret; | |
a28ec197 | 901 | } |
54aa1f4d CM |
902 | |
903 | ret = btrfs_search_slot(trans, extent_root, &key, path, -1, 1); | |
904 | if (ret < 0) | |
905 | return ret; | |
906 | BUG_ON(ret); | |
5caf2a00 | 907 | ei = btrfs_item_ptr(btrfs_buffer_leaf(path->nodes[0]), path->slots[0], |
123abc88 | 908 | struct btrfs_extent_item); |
a28ec197 | 909 | BUG_ON(ei->refs == 0); |
cf27e1ee CM |
910 | refs = btrfs_extent_refs(ei) - 1; |
911 | btrfs_set_extent_refs(ei, refs); | |
5caf2a00 | 912 | btrfs_mark_buffer_dirty(path->nodes[0]); |
cf27e1ee | 913 | if (refs == 0) { |
1261ec42 | 914 | u64 super_blocks_used; |
78fae27e CM |
915 | |
916 | if (pin) { | |
8ef97622 | 917 | ret = pin_down_block(root, blocknr, 0); |
78fae27e CM |
918 | BUG_ON(ret); |
919 | } | |
920 | ||
4b52dff6 CM |
921 | super_blocks_used = btrfs_super_blocks_used(&info->super_copy); |
922 | btrfs_set_super_blocks_used(&info->super_copy, | |
1261ec42 | 923 | super_blocks_used - num_blocks); |
5caf2a00 | 924 | ret = btrfs_del_item(trans, extent_root, path); |
54aa1f4d CM |
925 | if (ret) { |
926 | return ret; | |
927 | } | |
e37c9e69 | 928 | ret = update_block_group(trans, root, blocknr, num_blocks, 0, |
1e2677e0 | 929 | mark_free, 0); |
9078a3e1 | 930 | BUG_ON(ret); |
a28ec197 | 931 | } |
5caf2a00 | 932 | btrfs_free_path(path); |
e089f05c | 933 | finish_current_insert(trans, extent_root); |
a28ec197 CM |
934 | return ret; |
935 | } | |
936 | ||
a28ec197 CM |
937 | /* |
938 | * find all the blocks marked as pending in the radix tree and remove | |
939 | * them from the extent map | |
940 | */ | |
e089f05c CM |
941 | static int del_pending_extents(struct btrfs_trans_handle *trans, struct |
942 | btrfs_root *extent_root) | |
a28ec197 CM |
943 | { |
944 | int ret; | |
e20d96d6 CM |
945 | int wret; |
946 | int err = 0; | |
8ef97622 | 947 | unsigned long gang[4]; |
a28ec197 | 948 | int i; |
8ef97622 CM |
949 | struct radix_tree_root *pending_radix; |
950 | struct radix_tree_root *pinned_radix; | |
be744175 | 951 | struct btrfs_block_group_cache *cache; |
8ef97622 CM |
952 | |
953 | pending_radix = &extent_root->fs_info->pending_del_radix; | |
954 | pinned_radix = &extent_root->fs_info->pinned_radix; | |
a28ec197 CM |
955 | |
956 | while(1) { | |
e37c9e69 | 957 | ret = find_first_radix_bit(pending_radix, gang, 0, |
8ef97622 | 958 | ARRAY_SIZE(gang)); |
a28ec197 CM |
959 | if (!ret) |
960 | break; | |
961 | for (i = 0; i < ret; i++) { | |
8ef97622 | 962 | wret = set_radix_bit(pinned_radix, gang[i]); |
be744175 | 963 | if (wret == 0) { |
5276aeda CM |
964 | cache = |
965 | btrfs_lookup_block_group(extent_root->fs_info, | |
be744175 CM |
966 | gang[i]); |
967 | if (cache) | |
968 | cache->pinned++; | |
969 | } | |
970 | if (wret < 0) { | |
971 | printk(KERN_CRIT "set_radix_bit, err %d\n", | |
972 | wret); | |
973 | BUG_ON(wret < 0); | |
974 | } | |
8ef97622 CM |
975 | wret = clear_radix_bit(pending_radix, gang[i]); |
976 | BUG_ON(wret); | |
d5719762 | 977 | wret = __free_extent(trans, extent_root, |
e37c9e69 | 978 | gang[i], 1, 0, 0); |
e20d96d6 CM |
979 | if (wret) |
980 | err = wret; | |
fec577fb CM |
981 | } |
982 | } | |
e20d96d6 | 983 | return err; |
fec577fb CM |
984 | } |
985 | ||
986 | /* | |
987 | * remove an extent from the root, returns 0 on success | |
988 | */ | |
e089f05c CM |
989 | int btrfs_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root |
990 | *root, u64 blocknr, u64 num_blocks, int pin) | |
fec577fb | 991 | { |
9f5fae2f | 992 | struct btrfs_root *extent_root = root->fs_info->extent_root; |
fec577fb CM |
993 | int pending_ret; |
994 | int ret; | |
a28ec197 | 995 | |
fec577fb | 996 | if (root == extent_root) { |
8ef97622 | 997 | pin_down_block(root, blocknr, 1); |
fec577fb CM |
998 | return 0; |
999 | } | |
e37c9e69 | 1000 | ret = __free_extent(trans, root, blocknr, num_blocks, pin, pin == 0); |
e20d96d6 | 1001 | pending_ret = del_pending_extents(trans, root->fs_info->extent_root); |
fec577fb CM |
1002 | return ret ? ret : pending_ret; |
1003 | } | |
1004 | ||
1005 | /* | |
1006 | * walks the btree of allocated extents and find a hole of a given size. | |
1007 | * The key ins is changed to record the hole: | |
1008 | * ins->objectid == block start | |
62e2749e | 1009 | * ins->flags = BTRFS_EXTENT_ITEM_KEY |
fec577fb CM |
1010 | * ins->offset == number of blocks |
1011 | * Any available blocks before search_start are skipped. | |
1012 | */ | |
e089f05c CM |
1013 | static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root |
1014 | *orig_root, u64 num_blocks, u64 search_start, u64 | |
fbdc762b | 1015 | search_end, u64 hint_block, |
f2654de4 CM |
1016 | struct btrfs_key *ins, u64 exclude_start, |
1017 | u64 exclude_nr, int data) | |
fec577fb | 1018 | { |
5caf2a00 | 1019 | struct btrfs_path *path; |
e2fa7227 | 1020 | struct btrfs_key key; |
fec577fb CM |
1021 | int ret; |
1022 | u64 hole_size = 0; | |
1023 | int slot = 0; | |
e20d96d6 | 1024 | u64 last_block = 0; |
037e6390 | 1025 | u64 test_block; |
be744175 | 1026 | u64 orig_search_start = search_start; |
fec577fb | 1027 | int start_found; |
234b63a0 | 1028 | struct btrfs_leaf *l; |
9f5fae2f | 1029 | struct btrfs_root * root = orig_root->fs_info->extent_root; |
f2458e1d | 1030 | struct btrfs_fs_info *info = root->fs_info; |
0579da42 | 1031 | int total_needed = num_blocks; |
f2458e1d CM |
1032 | int total_found = 0; |
1033 | int fill_prealloc = 0; | |
e20d96d6 | 1034 | int level; |
be08c1b9 | 1035 | struct btrfs_block_group_cache *block_group; |
be744175 | 1036 | int full_scan = 0; |
fbdc762b | 1037 | int wrapped = 0; |
de428b63 | 1038 | u64 limit; |
fec577fb | 1039 | |
b1a4d965 CM |
1040 | ins->flags = 0; |
1041 | btrfs_set_key_type(ins, BTRFS_EXTENT_ITEM_KEY); | |
1042 | ||
e20d96d6 | 1043 | level = btrfs_header_level(btrfs_buffer_header(root->node)); |
f2458e1d CM |
1044 | if (num_blocks == 0) { |
1045 | fill_prealloc = 1; | |
1046 | num_blocks = 1; | |
308535a0 | 1047 | total_needed = (min(level + 1, BTRFS_MAX_LEVEL) + 2) * 3; |
f2458e1d | 1048 | } |
85e55b13 CM |
1049 | if (fill_prealloc) { |
1050 | u64 first; | |
1051 | int nr = info->extent_tree_prealloc_nr; | |
1052 | first = info->extent_tree_prealloc[nr - 1]; | |
1053 | if (info->extent_tree_prealloc_nr >= total_needed && | |
1054 | first >= search_start) { | |
1055 | ins->objectid = info->extent_tree_prealloc[0]; | |
1056 | ins->offset = 1; | |
1057 | return 0; | |
1058 | } | |
1059 | info->extent_tree_prealloc_nr = 0; | |
1060 | } | |
3e1ad54f | 1061 | if (search_end == (u64)-1) |
4b52dff6 | 1062 | search_end = btrfs_super_total_blocks(&info->super_copy); |
fbdc762b | 1063 | if (hint_block) { |
5276aeda | 1064 | block_group = btrfs_lookup_block_group(info, hint_block); |
be744175 | 1065 | block_group = btrfs_find_block_group(root, block_group, |
fbdc762b | 1066 | hint_block, data, 1); |
be744175 CM |
1067 | } else { |
1068 | block_group = btrfs_find_block_group(root, | |
1069 | trans->block_group, 0, | |
de428b63 | 1070 | data, 1); |
be744175 CM |
1071 | } |
1072 | ||
e011599b CM |
1073 | path = btrfs_alloc_path(); |
1074 | ||
be744175 | 1075 | check_failed: |
1e2677e0 | 1076 | if (!block_group->data) |
e37c9e69 CM |
1077 | search_start = find_search_start(root, &block_group, |
1078 | search_start, total_needed); | |
fbdc762b | 1079 | else if (!full_scan) |
e37c9e69 CM |
1080 | search_start = max(block_group->last_alloc, search_start); |
1081 | ||
5caf2a00 | 1082 | btrfs_init_path(path); |
fec577fb CM |
1083 | ins->objectid = search_start; |
1084 | ins->offset = 0; | |
fec577fb | 1085 | start_found = 0; |
e37c9e69 | 1086 | |
5caf2a00 | 1087 | ret = btrfs_search_slot(trans, root, ins, path, 0, 0); |
0f70abe2 CM |
1088 | if (ret < 0) |
1089 | goto error; | |
aa5d6bed | 1090 | |
e37c9e69 | 1091 | if (path->slots[0] > 0) { |
5caf2a00 | 1092 | path->slots[0]--; |
e37c9e69 CM |
1093 | } |
1094 | ||
1095 | l = btrfs_buffer_leaf(path->nodes[0]); | |
1096 | btrfs_disk_key_to_cpu(&key, &l->items[path->slots[0]].key); | |
1097 | /* | |
1098 | * a rare case, go back one key if we hit a block group item | |
1099 | * instead of an extent item | |
1100 | */ | |
1101 | if (btrfs_key_type(&key) != BTRFS_EXTENT_ITEM_KEY && | |
1102 | key.objectid + key.offset >= search_start) { | |
1103 | ins->objectid = key.objectid; | |
1104 | ins->offset = key.offset - 1; | |
1105 | btrfs_release_path(root, path); | |
1106 | ret = btrfs_search_slot(trans, root, ins, path, 0, 0); | |
1107 | if (ret < 0) | |
1108 | goto error; | |
1109 | ||
1110 | if (path->slots[0] > 0) { | |
1111 | path->slots[0]--; | |
1112 | } | |
1113 | } | |
0579da42 | 1114 | |
fec577fb | 1115 | while (1) { |
5caf2a00 CM |
1116 | l = btrfs_buffer_leaf(path->nodes[0]); |
1117 | slot = path->slots[0]; | |
7518a238 | 1118 | if (slot >= btrfs_header_nritems(&l->header)) { |
f2458e1d CM |
1119 | if (fill_prealloc) { |
1120 | info->extent_tree_prealloc_nr = 0; | |
1121 | total_found = 0; | |
1122 | } | |
de428b63 CM |
1123 | if (start_found) |
1124 | limit = last_block + | |
84f54cfa | 1125 | (block_group->key.offset >> 1); |
de428b63 CM |
1126 | else |
1127 | limit = search_start + | |
84f54cfa | 1128 | (block_group->key.offset >> 1); |
5caf2a00 | 1129 | ret = btrfs_next_leaf(root, path); |
fec577fb CM |
1130 | if (ret == 0) |
1131 | continue; | |
0f70abe2 CM |
1132 | if (ret < 0) |
1133 | goto error; | |
fec577fb CM |
1134 | if (!start_found) { |
1135 | ins->objectid = search_start; | |
3e1ad54f | 1136 | ins->offset = search_end - search_start; |
fec577fb CM |
1137 | start_found = 1; |
1138 | goto check_pending; | |
1139 | } | |
1140 | ins->objectid = last_block > search_start ? | |
1141 | last_block : search_start; | |
3e1ad54f | 1142 | ins->offset = search_end - ins->objectid; |
fec577fb CM |
1143 | goto check_pending; |
1144 | } | |
e37c9e69 | 1145 | |
e2fa7227 | 1146 | btrfs_disk_key_to_cpu(&key, &l->items[slot].key); |
e37c9e69 CM |
1147 | if (key.objectid >= search_start && key.objectid > last_block && |
1148 | start_found) { | |
1149 | if (last_block < search_start) | |
1150 | last_block = search_start; | |
1151 | hole_size = key.objectid - last_block; | |
1152 | if (hole_size >= num_blocks) { | |
1153 | ins->objectid = last_block; | |
1154 | ins->offset = hole_size; | |
1155 | goto check_pending; | |
0579da42 | 1156 | } |
fec577fb | 1157 | } |
e37c9e69 CM |
1158 | |
1159 | if (btrfs_key_type(&key) != BTRFS_EXTENT_ITEM_KEY) | |
1160 | goto next; | |
1161 | ||
0579da42 | 1162 | start_found = 1; |
e2fa7227 | 1163 | last_block = key.objectid + key.offset; |
fbdc762b | 1164 | if (!full_scan && last_block >= block_group->key.objectid + |
be744175 CM |
1165 | block_group->key.offset) { |
1166 | btrfs_release_path(root, path); | |
1167 | search_start = block_group->key.objectid + | |
1168 | block_group->key.offset * 2; | |
1169 | goto new_group; | |
1170 | } | |
9078a3e1 | 1171 | next: |
5caf2a00 | 1172 | path->slots[0]++; |
de428b63 | 1173 | cond_resched(); |
fec577fb | 1174 | } |
fec577fb CM |
1175 | check_pending: |
1176 | /* we have to make sure we didn't find an extent that has already | |
1177 | * been allocated by the map tree or the original allocation | |
1178 | */ | |
5caf2a00 | 1179 | btrfs_release_path(root, path); |
fec577fb | 1180 | BUG_ON(ins->objectid < search_start); |
e37c9e69 | 1181 | |
3e1ad54f | 1182 | if (ins->objectid + num_blocks >= search_end) { |
fbdc762b CM |
1183 | if (full_scan) { |
1184 | ret = -ENOSPC; | |
1185 | goto error; | |
1186 | } | |
be744175 | 1187 | search_start = orig_search_start; |
fbdc762b CM |
1188 | if (wrapped) |
1189 | full_scan = 1; | |
1190 | else | |
1191 | wrapped = 1; | |
be744175 | 1192 | goto new_group; |
06a2f9fa | 1193 | } |
037e6390 | 1194 | for (test_block = ins->objectid; |
f2458e1d CM |
1195 | test_block < ins->objectid + num_blocks; test_block++) { |
1196 | if (test_radix_bit(&info->pinned_radix, test_block)) { | |
037e6390 | 1197 | search_start = test_block + 1; |
be744175 | 1198 | goto new_group; |
fec577fb CM |
1199 | } |
1200 | } | |
f2458e1d CM |
1201 | if (!fill_prealloc && info->extent_tree_insert_nr) { |
1202 | u64 last = | |
1203 | info->extent_tree_insert[info->extent_tree_insert_nr - 1]; | |
1204 | if (ins->objectid + num_blocks > | |
1205 | info->extent_tree_insert[0] && | |
1206 | ins->objectid <= last) { | |
1207 | search_start = last + 1; | |
e37c9e69 | 1208 | WARN_ON(!full_scan); |
be744175 | 1209 | goto new_group; |
f2458e1d CM |
1210 | } |
1211 | } | |
1212 | if (!fill_prealloc && info->extent_tree_prealloc_nr) { | |
1213 | u64 first = | |
1214 | info->extent_tree_prealloc[info->extent_tree_prealloc_nr - 1]; | |
1215 | if (ins->objectid + num_blocks > first && | |
1216 | ins->objectid <= info->extent_tree_prealloc[0]) { | |
1217 | search_start = info->extent_tree_prealloc[0] + 1; | |
be744175 | 1218 | goto new_group; |
f2458e1d CM |
1219 | } |
1220 | } | |
f2654de4 CM |
1221 | if (exclude_nr > 0 && (ins->objectid + num_blocks > exclude_start && |
1222 | ins->objectid < exclude_start + exclude_nr)) { | |
1223 | search_start = exclude_start + exclude_nr; | |
1224 | goto new_group; | |
1225 | } | |
f2458e1d CM |
1226 | if (fill_prealloc) { |
1227 | int nr; | |
1228 | test_block = ins->objectid; | |
e37c9e69 CM |
1229 | if (test_block - info->extent_tree_prealloc[total_needed - 1] >= |
1230 | leaf_range(root)) { | |
1231 | total_found = 0; | |
1232 | info->extent_tree_prealloc_nr = total_found; | |
1233 | } | |
f2458e1d CM |
1234 | while(test_block < ins->objectid + ins->offset && |
1235 | total_found < total_needed) { | |
1236 | nr = total_needed - total_found - 1; | |
1237 | BUG_ON(nr < 0); | |
cd1bc465 | 1238 | info->extent_tree_prealloc[nr] = test_block; |
f2458e1d CM |
1239 | total_found++; |
1240 | test_block++; | |
1241 | } | |
1242 | if (total_found < total_needed) { | |
1243 | search_start = test_block; | |
be744175 | 1244 | goto new_group; |
f2458e1d | 1245 | } |
cd1bc465 CM |
1246 | info->extent_tree_prealloc_nr = total_found; |
1247 | } | |
e37c9e69 | 1248 | if (!data) { |
5276aeda | 1249 | block_group = btrfs_lookup_block_group(info, ins->objectid); |
e37c9e69 CM |
1250 | if (block_group) { |
1251 | if (fill_prealloc) | |
1252 | block_group->last_prealloc = | |
1253 | info->extent_tree_prealloc[total_needed-1]; | |
1254 | else | |
1255 | trans->block_group = block_group; | |
1256 | } | |
f2458e1d | 1257 | } |
037e6390 | 1258 | ins->offset = num_blocks; |
5caf2a00 | 1259 | btrfs_free_path(path); |
fec577fb | 1260 | return 0; |
be744175 CM |
1261 | |
1262 | new_group: | |
3e1ad54f | 1263 | if (search_start + num_blocks >= search_end) { |
be744175 | 1264 | search_start = orig_search_start; |
fbdc762b CM |
1265 | if (full_scan) { |
1266 | ret = -ENOSPC; | |
1267 | goto error; | |
1268 | } | |
1269 | if (wrapped) | |
1270 | full_scan = 1; | |
1271 | else | |
1272 | wrapped = 1; | |
be744175 | 1273 | } |
5276aeda | 1274 | block_group = btrfs_lookup_block_group(info, search_start); |
fbdc762b | 1275 | cond_resched(); |
be744175 CM |
1276 | if (!full_scan) |
1277 | block_group = btrfs_find_block_group(root, block_group, | |
de428b63 | 1278 | search_start, data, 0); |
be744175 CM |
1279 | goto check_failed; |
1280 | ||
0f70abe2 | 1281 | error: |
5caf2a00 CM |
1282 | btrfs_release_path(root, path); |
1283 | btrfs_free_path(path); | |
0f70abe2 | 1284 | return ret; |
fec577fb | 1285 | } |
fec577fb CM |
1286 | /* |
1287 | * finds a free extent and does all the dirty work required for allocation | |
1288 | * returns the key for the extent through ins, and a tree buffer for | |
1289 | * the first block of the extent through buf. | |
1290 | * | |
1291 | * returns 0 if everything worked, non-zero otherwise. | |
1292 | */ | |
4d775673 CM |
1293 | int btrfs_alloc_extent(struct btrfs_trans_handle *trans, |
1294 | struct btrfs_root *root, u64 owner, | |
fbdc762b | 1295 | u64 num_blocks, u64 hint_block, |
be08c1b9 | 1296 | u64 search_end, struct btrfs_key *ins, int data) |
fec577fb CM |
1297 | { |
1298 | int ret; | |
1299 | int pending_ret; | |
1261ec42 | 1300 | u64 super_blocks_used; |
fbdc762b | 1301 | u64 search_start = 0; |
f2654de4 CM |
1302 | u64 exclude_start = 0; |
1303 | u64 exclude_nr = 0; | |
1261ec42 CM |
1304 | struct btrfs_fs_info *info = root->fs_info; |
1305 | struct btrfs_root *extent_root = info->extent_root; | |
234b63a0 | 1306 | struct btrfs_extent_item extent_item; |
f2458e1d | 1307 | struct btrfs_key prealloc_key; |
037e6390 | 1308 | |
cf27e1ee | 1309 | btrfs_set_extent_refs(&extent_item, 1); |
4d775673 | 1310 | btrfs_set_extent_owner(&extent_item, owner); |
fec577fb | 1311 | |
037e6390 | 1312 | if (root == extent_root) { |
f2458e1d CM |
1313 | int nr; |
1314 | BUG_ON(info->extent_tree_prealloc_nr == 0); | |
037e6390 | 1315 | BUG_ON(num_blocks != 1); |
037e6390 | 1316 | ins->offset = 1; |
f2458e1d CM |
1317 | info->extent_tree_prealloc_nr--; |
1318 | nr = info->extent_tree_prealloc_nr; | |
1319 | ins->objectid = info->extent_tree_prealloc[nr]; | |
1320 | info->extent_tree_insert[info->extent_tree_insert_nr++] = | |
1321 | ins->objectid; | |
9078a3e1 | 1322 | ret = update_block_group(trans, root, |
1e2677e0 | 1323 | ins->objectid, ins->offset, 1, 0, 0); |
9078a3e1 | 1324 | BUG_ON(ret); |
fec577fb CM |
1325 | return 0; |
1326 | } | |
e37c9e69 CM |
1327 | |
1328 | /* | |
1329 | * if we're doing a data allocation, preallocate room in the | |
1330 | * extent tree first. This way the extent tree blocks end up | |
1331 | * in the correct block group. | |
1332 | */ | |
1333 | if (data) { | |
de428b63 | 1334 | ret = find_free_extent(trans, root, 0, 0, |
f2654de4 | 1335 | search_end, 0, &prealloc_key, 0, 0, 0); |
ccd467d6 | 1336 | BUG_ON(ret); |
f2654de4 | 1337 | if (ret) |
e37c9e69 | 1338 | return ret; |
f2654de4 CM |
1339 | exclude_nr = info->extent_tree_prealloc_nr; |
1340 | exclude_start = info->extent_tree_prealloc[exclude_nr - 1]; | |
e37c9e69 | 1341 | } |
f2654de4 | 1342 | |
f2458e1d | 1343 | /* do the real allocation */ |
e089f05c | 1344 | ret = find_free_extent(trans, root, num_blocks, search_start, |
f2654de4 CM |
1345 | search_end, hint_block, ins, |
1346 | exclude_start, exclude_nr, data); | |
ccd467d6 | 1347 | BUG_ON(ret); |
f2654de4 CM |
1348 | if (ret) |
1349 | return ret; | |
fec577fb | 1350 | |
e37c9e69 CM |
1351 | /* |
1352 | * if we're doing a metadata allocation, preallocate space in the | |
1353 | * extent tree second. This way, we don't create a tiny hole | |
1354 | * in the allocation map between any unused preallocation blocks | |
1355 | * and the metadata block we're actually allocating. On disk, | |
1356 | * it'll go: | |
1357 | * [block we've allocated], [used prealloc 1], [ unused prealloc ] | |
1358 | * The unused prealloc will get reused the next time around. | |
1359 | */ | |
1360 | if (!data) { | |
f2654de4 CM |
1361 | exclude_start = ins->objectid; |
1362 | exclude_nr = ins->offset; | |
ccd467d6 | 1363 | hint_block = exclude_start + exclude_nr; |
e37c9e69 | 1364 | ret = find_free_extent(trans, root, 0, search_start, |
fbdc762b | 1365 | search_end, hint_block, |
f2654de4 CM |
1366 | &prealloc_key, exclude_start, |
1367 | exclude_nr, 0); | |
ccd467d6 | 1368 | BUG_ON(ret); |
f2654de4 CM |
1369 | if (ret) |
1370 | return ret; | |
e37c9e69 | 1371 | } |
f2458e1d | 1372 | |
4b52dff6 CM |
1373 | super_blocks_used = btrfs_super_blocks_used(&info->super_copy); |
1374 | btrfs_set_super_blocks_used(&info->super_copy, super_blocks_used + | |
1261ec42 | 1375 | num_blocks); |
e089f05c CM |
1376 | ret = btrfs_insert_item(trans, extent_root, ins, &extent_item, |
1377 | sizeof(extent_item)); | |
037e6390 | 1378 | |
ccd467d6 | 1379 | BUG_ON(ret); |
e089f05c | 1380 | finish_current_insert(trans, extent_root); |
e20d96d6 | 1381 | pending_ret = del_pending_extents(trans, extent_root); |
e37c9e69 | 1382 | if (ret) { |
037e6390 | 1383 | return ret; |
e37c9e69 CM |
1384 | } |
1385 | if (pending_ret) { | |
037e6390 | 1386 | return pending_ret; |
e37c9e69 | 1387 | } |
1e2677e0 CM |
1388 | ret = update_block_group(trans, root, ins->objectid, ins->offset, 1, 0, |
1389 | data); | |
fabb5681 | 1390 | BUG_ON(ret); |
037e6390 | 1391 | return 0; |
fec577fb CM |
1392 | } |
1393 | ||
1394 | /* | |
1395 | * helper function to allocate a block for a given tree | |
1396 | * returns the tree buffer or NULL. | |
1397 | */ | |
e20d96d6 | 1398 | struct buffer_head *btrfs_alloc_free_block(struct btrfs_trans_handle *trans, |
31f3c99b | 1399 | struct btrfs_root *root, u64 hint) |
fec577fb | 1400 | { |
e2fa7227 | 1401 | struct btrfs_key ins; |
fec577fb | 1402 | int ret; |
e20d96d6 | 1403 | struct buffer_head *buf; |
fec577fb | 1404 | |
4d775673 | 1405 | ret = btrfs_alloc_extent(trans, root, root->root_key.objectid, |
de428b63 | 1406 | 1, hint, (unsigned long)-1, &ins, 0); |
fec577fb | 1407 | if (ret) { |
54aa1f4d CM |
1408 | BUG_ON(ret > 0); |
1409 | return ERR_PTR(ret); | |
fec577fb | 1410 | } |
d98237b3 | 1411 | buf = btrfs_find_create_tree_block(root, ins.objectid); |
54aa1f4d CM |
1412 | if (!buf) { |
1413 | btrfs_free_extent(trans, root, ins.objectid, 1, 0); | |
1414 | return ERR_PTR(-ENOMEM); | |
1415 | } | |
df2ce34c | 1416 | set_buffer_uptodate(buf); |
090d1875 | 1417 | set_buffer_checked(buf); |
7c4452b9 | 1418 | set_radix_bit(&trans->transaction->dirty_pages, buf->b_page->index); |
fec577fb CM |
1419 | return buf; |
1420 | } | |
a28ec197 | 1421 | |
6407bf6d CM |
1422 | static int drop_leaf_ref(struct btrfs_trans_handle *trans, |
1423 | struct btrfs_root *root, struct buffer_head *cur) | |
1424 | { | |
1425 | struct btrfs_disk_key *key; | |
1426 | struct btrfs_leaf *leaf; | |
1427 | struct btrfs_file_extent_item *fi; | |
1428 | int i; | |
1429 | int nritems; | |
1430 | int ret; | |
1431 | ||
1432 | BUG_ON(!btrfs_is_leaf(btrfs_buffer_node(cur))); | |
1433 | leaf = btrfs_buffer_leaf(cur); | |
1434 | nritems = btrfs_header_nritems(&leaf->header); | |
1435 | for (i = 0; i < nritems; i++) { | |
3a686375 | 1436 | u64 disk_blocknr; |
6407bf6d CM |
1437 | key = &leaf->items[i].key; |
1438 | if (btrfs_disk_key_type(key) != BTRFS_EXTENT_DATA_KEY) | |
1439 | continue; | |
1440 | fi = btrfs_item_ptr(leaf, i, struct btrfs_file_extent_item); | |
236454df CM |
1441 | if (btrfs_file_extent_type(fi) == BTRFS_FILE_EXTENT_INLINE) |
1442 | continue; | |
6407bf6d CM |
1443 | /* |
1444 | * FIXME make sure to insert a trans record that | |
1445 | * repeats the snapshot del on crash | |
1446 | */ | |
3a686375 CM |
1447 | disk_blocknr = btrfs_file_extent_disk_blocknr(fi); |
1448 | if (disk_blocknr == 0) | |
1449 | continue; | |
1450 | ret = btrfs_free_extent(trans, root, disk_blocknr, | |
6407bf6d CM |
1451 | btrfs_file_extent_disk_num_blocks(fi), |
1452 | 0); | |
1453 | BUG_ON(ret); | |
1454 | } | |
1455 | return 0; | |
1456 | } | |
1457 | ||
e011599b CM |
1458 | static void reada_walk_down(struct btrfs_root *root, |
1459 | struct btrfs_node *node) | |
1460 | { | |
1461 | int i; | |
1462 | u32 nritems; | |
1463 | u64 blocknr; | |
1464 | int ret; | |
1465 | u32 refs; | |
1466 | ||
1467 | nritems = btrfs_header_nritems(&node->header); | |
1468 | for (i = 0; i < nritems; i++) { | |
1469 | blocknr = btrfs_node_blockptr(node, i); | |
1470 | ret = lookup_extent_ref(NULL, root, blocknr, 1, &refs); | |
1471 | BUG_ON(ret); | |
1472 | if (refs != 1) | |
1473 | continue; | |
1474 | ret = readahead_tree_block(root, blocknr); | |
1475 | if (ret) | |
1476 | break; | |
1477 | } | |
1478 | } | |
1479 | ||
9aca1d51 CM |
1480 | /* |
1481 | * helper function for drop_snapshot, this walks down the tree dropping ref | |
1482 | * counts as it goes. | |
1483 | */ | |
e089f05c CM |
1484 | static int walk_down_tree(struct btrfs_trans_handle *trans, struct btrfs_root |
1485 | *root, struct btrfs_path *path, int *level) | |
20524f02 | 1486 | { |
e20d96d6 CM |
1487 | struct buffer_head *next; |
1488 | struct buffer_head *cur; | |
20524f02 CM |
1489 | u64 blocknr; |
1490 | int ret; | |
1491 | u32 refs; | |
1492 | ||
5caf2a00 CM |
1493 | WARN_ON(*level < 0); |
1494 | WARN_ON(*level >= BTRFS_MAX_LEVEL); | |
b18c6685 | 1495 | ret = lookup_extent_ref(trans, root, bh_blocknr(path->nodes[*level]), |
6407bf6d | 1496 | 1, &refs); |
20524f02 CM |
1497 | BUG_ON(ret); |
1498 | if (refs > 1) | |
1499 | goto out; | |
e011599b | 1500 | |
9aca1d51 CM |
1501 | /* |
1502 | * walk down to the last node level and free all the leaves | |
1503 | */ | |
6407bf6d | 1504 | while(*level >= 0) { |
5caf2a00 CM |
1505 | WARN_ON(*level < 0); |
1506 | WARN_ON(*level >= BTRFS_MAX_LEVEL); | |
20524f02 | 1507 | cur = path->nodes[*level]; |
e011599b CM |
1508 | |
1509 | if (*level > 0 && path->slots[*level] == 0) | |
1510 | reada_walk_down(root, btrfs_buffer_node(cur)); | |
1511 | ||
2c90e5d6 CM |
1512 | if (btrfs_header_level(btrfs_buffer_header(cur)) != *level) |
1513 | WARN_ON(1); | |
e011599b | 1514 | |
7518a238 | 1515 | if (path->slots[*level] >= |
e20d96d6 | 1516 | btrfs_header_nritems(btrfs_buffer_header(cur))) |
20524f02 | 1517 | break; |
6407bf6d CM |
1518 | if (*level == 0) { |
1519 | ret = drop_leaf_ref(trans, root, cur); | |
1520 | BUG_ON(ret); | |
1521 | break; | |
1522 | } | |
e20d96d6 CM |
1523 | blocknr = btrfs_node_blockptr(btrfs_buffer_node(cur), |
1524 | path->slots[*level]); | |
b18c6685 | 1525 | ret = lookup_extent_ref(trans, root, blocknr, 1, &refs); |
6407bf6d CM |
1526 | BUG_ON(ret); |
1527 | if (refs != 1) { | |
20524f02 | 1528 | path->slots[*level]++; |
e089f05c | 1529 | ret = btrfs_free_extent(trans, root, blocknr, 1, 1); |
20524f02 CM |
1530 | BUG_ON(ret); |
1531 | continue; | |
1532 | } | |
20524f02 | 1533 | next = read_tree_block(root, blocknr); |
5caf2a00 | 1534 | WARN_ON(*level <= 0); |
83e15a28 | 1535 | if (path->nodes[*level-1]) |
234b63a0 | 1536 | btrfs_block_release(root, path->nodes[*level-1]); |
20524f02 | 1537 | path->nodes[*level-1] = next; |
e20d96d6 | 1538 | *level = btrfs_header_level(btrfs_buffer_header(next)); |
20524f02 CM |
1539 | path->slots[*level] = 0; |
1540 | } | |
1541 | out: | |
5caf2a00 CM |
1542 | WARN_ON(*level < 0); |
1543 | WARN_ON(*level >= BTRFS_MAX_LEVEL); | |
6407bf6d | 1544 | ret = btrfs_free_extent(trans, root, |
7eccb903 | 1545 | bh_blocknr(path->nodes[*level]), 1, 1); |
234b63a0 | 1546 | btrfs_block_release(root, path->nodes[*level]); |
20524f02 CM |
1547 | path->nodes[*level] = NULL; |
1548 | *level += 1; | |
1549 | BUG_ON(ret); | |
1550 | return 0; | |
1551 | } | |
1552 | ||
9aca1d51 CM |
1553 | /* |
1554 | * helper for dropping snapshots. This walks back up the tree in the path | |
1555 | * to find the first node higher up where we haven't yet gone through | |
1556 | * all the slots | |
1557 | */ | |
e089f05c CM |
1558 | static int walk_up_tree(struct btrfs_trans_handle *trans, struct btrfs_root |
1559 | *root, struct btrfs_path *path, int *level) | |
20524f02 CM |
1560 | { |
1561 | int i; | |
1562 | int slot; | |
1563 | int ret; | |
234b63a0 | 1564 | for(i = *level; i < BTRFS_MAX_LEVEL - 1 && path->nodes[i]; i++) { |
20524f02 | 1565 | slot = path->slots[i]; |
e20d96d6 CM |
1566 | if (slot < btrfs_header_nritems( |
1567 | btrfs_buffer_header(path->nodes[i])) - 1) { | |
20524f02 CM |
1568 | path->slots[i]++; |
1569 | *level = i; | |
1570 | return 0; | |
1571 | } else { | |
e089f05c | 1572 | ret = btrfs_free_extent(trans, root, |
7eccb903 | 1573 | bh_blocknr(path->nodes[*level]), |
e089f05c | 1574 | 1, 1); |
6407bf6d | 1575 | BUG_ON(ret); |
234b63a0 | 1576 | btrfs_block_release(root, path->nodes[*level]); |
83e15a28 | 1577 | path->nodes[*level] = NULL; |
20524f02 | 1578 | *level = i + 1; |
20524f02 CM |
1579 | } |
1580 | } | |
1581 | return 1; | |
1582 | } | |
1583 | ||
9aca1d51 CM |
1584 | /* |
1585 | * drop the reference count on the tree rooted at 'snap'. This traverses | |
1586 | * the tree freeing any blocks that have a ref count of zero after being | |
1587 | * decremented. | |
1588 | */ | |
e089f05c | 1589 | int btrfs_drop_snapshot(struct btrfs_trans_handle *trans, struct btrfs_root |
e20d96d6 | 1590 | *root, struct buffer_head *snap) |
20524f02 | 1591 | { |
3768f368 | 1592 | int ret = 0; |
9aca1d51 | 1593 | int wret; |
20524f02 | 1594 | int level; |
5caf2a00 | 1595 | struct btrfs_path *path; |
20524f02 CM |
1596 | int i; |
1597 | int orig_level; | |
1598 | ||
5caf2a00 CM |
1599 | path = btrfs_alloc_path(); |
1600 | BUG_ON(!path); | |
20524f02 | 1601 | |
e20d96d6 | 1602 | level = btrfs_header_level(btrfs_buffer_header(snap)); |
20524f02 | 1603 | orig_level = level; |
5caf2a00 CM |
1604 | path->nodes[level] = snap; |
1605 | path->slots[level] = 0; | |
20524f02 | 1606 | while(1) { |
5caf2a00 | 1607 | wret = walk_down_tree(trans, root, path, &level); |
9aca1d51 | 1608 | if (wret > 0) |
20524f02 | 1609 | break; |
9aca1d51 CM |
1610 | if (wret < 0) |
1611 | ret = wret; | |
1612 | ||
5caf2a00 | 1613 | wret = walk_up_tree(trans, root, path, &level); |
9aca1d51 | 1614 | if (wret > 0) |
20524f02 | 1615 | break; |
9aca1d51 CM |
1616 | if (wret < 0) |
1617 | ret = wret; | |
20524f02 | 1618 | } |
83e15a28 | 1619 | for (i = 0; i <= orig_level; i++) { |
5caf2a00 CM |
1620 | if (path->nodes[i]) { |
1621 | btrfs_block_release(root, path->nodes[i]); | |
83e15a28 | 1622 | } |
20524f02 | 1623 | } |
5caf2a00 | 1624 | btrfs_free_path(path); |
9aca1d51 | 1625 | return ret; |
20524f02 | 1626 | } |
9078a3e1 | 1627 | |
be744175 | 1628 | static int free_block_group_radix(struct radix_tree_root *radix) |
9078a3e1 CM |
1629 | { |
1630 | int ret; | |
1631 | struct btrfs_block_group_cache *cache[8]; | |
1632 | int i; | |
1633 | ||
1634 | while(1) { | |
be744175 | 1635 | ret = radix_tree_gang_lookup(radix, (void **)cache, 0, |
9078a3e1 CM |
1636 | ARRAY_SIZE(cache)); |
1637 | if (!ret) | |
1638 | break; | |
1639 | for (i = 0; i < ret; i++) { | |
be744175 | 1640 | radix_tree_delete(radix, cache[i]->key.objectid + |
9078a3e1 CM |
1641 | cache[i]->key.offset - 1); |
1642 | kfree(cache[i]); | |
1643 | } | |
1644 | } | |
1645 | return 0; | |
1646 | } | |
1647 | ||
be744175 CM |
1648 | int btrfs_free_block_groups(struct btrfs_fs_info *info) |
1649 | { | |
1650 | int ret; | |
1651 | int ret2; | |
e37c9e69 CM |
1652 | unsigned long gang[16]; |
1653 | int i; | |
be744175 CM |
1654 | |
1655 | ret = free_block_group_radix(&info->block_group_radix); | |
1656 | ret2 = free_block_group_radix(&info->block_group_data_radix); | |
1657 | if (ret) | |
1658 | return ret; | |
1659 | if (ret2) | |
1660 | return ret2; | |
e37c9e69 CM |
1661 | |
1662 | while(1) { | |
1663 | ret = find_first_radix_bit(&info->extent_map_radix, | |
1664 | gang, 0, ARRAY_SIZE(gang)); | |
1665 | if (!ret) | |
1666 | break; | |
1667 | for (i = 0; i < ret; i++) { | |
1668 | clear_radix_bit(&info->extent_map_radix, gang[i]); | |
1669 | } | |
1670 | } | |
be744175 CM |
1671 | return 0; |
1672 | } | |
1673 | ||
9078a3e1 CM |
1674 | int btrfs_read_block_groups(struct btrfs_root *root) |
1675 | { | |
1676 | struct btrfs_path *path; | |
1677 | int ret; | |
1678 | int err = 0; | |
1679 | struct btrfs_block_group_item *bi; | |
1680 | struct btrfs_block_group_cache *cache; | |
be744175 CM |
1681 | struct btrfs_fs_info *info = root->fs_info; |
1682 | struct radix_tree_root *radix; | |
9078a3e1 CM |
1683 | struct btrfs_key key; |
1684 | struct btrfs_key found_key; | |
1685 | struct btrfs_leaf *leaf; | |
84f54cfa | 1686 | u64 group_size_blocks; |
31f3c99b | 1687 | u64 used; |
9078a3e1 | 1688 | |
84f54cfa CM |
1689 | group_size_blocks = BTRFS_BLOCK_GROUP_SIZE >> |
1690 | root->fs_info->sb->s_blocksize_bits; | |
be744175 | 1691 | root = info->extent_root; |
9078a3e1 CM |
1692 | key.objectid = 0; |
1693 | key.offset = group_size_blocks; | |
1694 | key.flags = 0; | |
1695 | btrfs_set_key_type(&key, BTRFS_BLOCK_GROUP_ITEM_KEY); | |
1696 | ||
1697 | path = btrfs_alloc_path(); | |
1698 | if (!path) | |
1699 | return -ENOMEM; | |
1700 | ||
1701 | while(1) { | |
be744175 | 1702 | ret = btrfs_search_slot(NULL, info->extent_root, |
9078a3e1 CM |
1703 | &key, path, 0, 0); |
1704 | if (ret != 0) { | |
1705 | err = ret; | |
1706 | break; | |
1707 | } | |
1708 | leaf = btrfs_buffer_leaf(path->nodes[0]); | |
1709 | btrfs_disk_key_to_cpu(&found_key, | |
1710 | &leaf->items[path->slots[0]].key); | |
1711 | cache = kmalloc(sizeof(*cache), GFP_NOFS); | |
1712 | if (!cache) { | |
1713 | err = -1; | |
1714 | break; | |
1715 | } | |
3e1ad54f | 1716 | |
1e2677e0 CM |
1717 | bi = btrfs_item_ptr(leaf, path->slots[0], |
1718 | struct btrfs_block_group_item); | |
1719 | if (bi->flags & BTRFS_BLOCK_GROUP_DATA) { | |
3e1ad54f | 1720 | radix = &info->block_group_data_radix; |
1e2677e0 CM |
1721 | cache->data = 1; |
1722 | } else { | |
3e1ad54f | 1723 | radix = &info->block_group_radix; |
1e2677e0 CM |
1724 | cache->data = 0; |
1725 | } | |
3e1ad54f | 1726 | |
9078a3e1 CM |
1727 | memcpy(&cache->item, bi, sizeof(*bi)); |
1728 | memcpy(&cache->key, &found_key, sizeof(found_key)); | |
31f3c99b CM |
1729 | cache->last_alloc = cache->key.objectid; |
1730 | cache->first_free = cache->key.objectid; | |
e37c9e69 | 1731 | cache->last_prealloc = cache->key.objectid; |
be744175 | 1732 | cache->pinned = 0; |
e37c9e69 CM |
1733 | cache->cached = 0; |
1734 | ||
3e1ad54f CM |
1735 | cache->radix = radix; |
1736 | ||
9078a3e1 CM |
1737 | key.objectid = found_key.objectid + found_key.offset; |
1738 | btrfs_release_path(root, path); | |
be744175 | 1739 | ret = radix_tree_insert(radix, found_key.objectid + |
9078a3e1 CM |
1740 | found_key.offset - 1, |
1741 | (void *)cache); | |
1742 | BUG_ON(ret); | |
31f3c99b | 1743 | used = btrfs_block_group_used(bi); |
84f54cfa | 1744 | if (used < div_factor(key.offset, 8)) { |
be744175 | 1745 | radix_tree_tag_set(radix, found_key.objectid + |
31f3c99b CM |
1746 | found_key.offset - 1, |
1747 | BTRFS_BLOCK_GROUP_AVAIL); | |
1748 | } | |
9078a3e1 | 1749 | if (key.objectid >= |
4b52dff6 | 1750 | btrfs_super_total_blocks(&info->super_copy)) |
9078a3e1 CM |
1751 | break; |
1752 | } | |
1753 | ||
1754 | btrfs_free_path(path); | |
1755 | return 0; | |
1756 | } |