Btrfs: 32 bit compile fixes for the resizer and enospc checks
[linux-2.6-block.git] / fs / btrfs / extent-tree.c
CommitLineData
6cbd5570
CM
1/*
2 * Copyright (C) 2007 Oracle. All rights reserved.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public
6 * License v2 as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope that it will be useful,
9 * but WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
12 *
13 * You should have received a copy of the GNU General Public
14 * License along with this program; if not, write to the
15 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
16 * Boston, MA 021110-1307, USA.
17 */
18
ec6b910f 19#include <linux/sched.h>
7bb86316 20#include <linux/crc32c.h>
edbd8d4e 21#include <linux/pagemap.h>
74493f7a 22#include "hash.h"
fec577fb
CM
23#include "ctree.h"
24#include "disk-io.h"
25#include "print-tree.h"
e089f05c 26#include "transaction.h"
fec577fb 27
96b5179d
CM
28#define BLOCK_GROUP_DATA EXTENT_WRITEBACK
29#define BLOCK_GROUP_METADATA EXTENT_UPTODATE
30#define BLOCK_GROUP_DIRTY EXTENT_DIRTY
31
e089f05c
CM
32static int finish_current_insert(struct btrfs_trans_handle *trans, struct
33 btrfs_root *extent_root);
e20d96d6
CM
34static int del_pending_extents(struct btrfs_trans_handle *trans, struct
35 btrfs_root *extent_root);
fec577fb 36
e37c9e69
CM
37static int cache_block_group(struct btrfs_root *root,
38 struct btrfs_block_group_cache *block_group)
39{
40 struct btrfs_path *path;
41 int ret;
42 struct btrfs_key key;
5f39d397 43 struct extent_buffer *leaf;
f510cfec 44 struct extent_map_tree *free_space_cache;
e37c9e69 45 int slot;
e37c9e69
CM
46 u64 last = 0;
47 u64 hole_size;
7d7d6068 48 u64 first_free;
e37c9e69
CM
49 int found = 0;
50
00f5c795
CM
51 if (!block_group)
52 return 0;
53
e37c9e69 54 root = root->fs_info->extent_root;
f510cfec 55 free_space_cache = &root->fs_info->free_space_cache;
e37c9e69
CM
56
57 if (block_group->cached)
58 return 0;
f510cfec 59
e37c9e69
CM
60 path = btrfs_alloc_path();
61 if (!path)
62 return -ENOMEM;
7d7d6068 63
2cc58cf2 64 path->reada = 2;
7d7d6068 65 first_free = block_group->key.objectid;
e37c9e69 66 key.objectid = block_group->key.objectid;
e37c9e69 67 key.offset = 0;
7d7d6068 68
e37c9e69
CM
69 btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
70 ret = btrfs_search_slot(NULL, root, &key, path, 0, 0);
7d7d6068 71
e37c9e69
CM
72 if (ret < 0)
73 return ret;
7d7d6068 74
e37c9e69
CM
75 if (ret && path->slots[0] > 0)
76 path->slots[0]--;
7d7d6068 77
e37c9e69 78 while(1) {
5f39d397 79 leaf = path->nodes[0];
e37c9e69 80 slot = path->slots[0];
5f39d397 81 if (slot >= btrfs_header_nritems(leaf)) {
e37c9e69 82 ret = btrfs_next_leaf(root, path);
54aa1f4d
CM
83 if (ret < 0)
84 goto err;
de428b63 85 if (ret == 0) {
e37c9e69 86 continue;
de428b63 87 } else {
e37c9e69
CM
88 break;
89 }
90 }
7d7d6068 91
5f39d397 92 btrfs_item_key_to_cpu(leaf, &key, slot);
7d7d6068 93 if (key.objectid < block_group->key.objectid) {
7bb86316
CM
94 if (btrfs_key_type(&key) != BTRFS_EXTENT_REF_KEY &&
95 key.objectid + key.offset > first_free)
7d7d6068
Y
96 first_free = key.objectid + key.offset;
97 goto next;
98 }
99
e37c9e69
CM
100 if (key.objectid >= block_group->key.objectid +
101 block_group->key.offset) {
e37c9e69
CM
102 break;
103 }
7d7d6068 104
e37c9e69
CM
105 if (btrfs_key_type(&key) == BTRFS_EXTENT_ITEM_KEY) {
106 if (!found) {
7d7d6068 107 last = first_free;
e37c9e69 108 found = 1;
e37c9e69 109 }
f510cfec
CM
110 if (key.objectid > last) {
111 hole_size = key.objectid - last;
112 set_extent_dirty(free_space_cache, last,
113 last + hole_size - 1,
114 GFP_NOFS);
7d7d6068
Y
115 }
116 last = key.objectid + key.offset;
e37c9e69 117 }
7d7d6068 118next:
e37c9e69
CM
119 path->slots[0]++;
120 }
121
7d7d6068
Y
122 if (!found)
123 last = first_free;
124 if (block_group->key.objectid +
125 block_group->key.offset > last) {
126 hole_size = block_group->key.objectid +
127 block_group->key.offset - last;
f510cfec
CM
128 set_extent_dirty(free_space_cache, last,
129 last + hole_size - 1, GFP_NOFS);
7d7d6068 130 }
e37c9e69 131 block_group->cached = 1;
54aa1f4d 132err:
e37c9e69
CM
133 btrfs_free_path(path);
134 return 0;
135}
136
5276aeda
CM
137struct btrfs_block_group_cache *btrfs_lookup_block_group(struct
138 btrfs_fs_info *info,
db94535d 139 u64 bytenr)
be744175 140{
96b5179d
CM
141 struct extent_map_tree *block_group_cache;
142 struct btrfs_block_group_cache *block_group = NULL;
143 u64 ptr;
144 u64 start;
145 u64 end;
be744175
CM
146 int ret;
147
96b5179d
CM
148 block_group_cache = &info->block_group_cache;
149 ret = find_first_extent_bit(block_group_cache,
db94535d 150 bytenr, &start, &end,
96b5179d 151 BLOCK_GROUP_DATA | BLOCK_GROUP_METADATA);
be744175 152 if (ret) {
96b5179d 153 return NULL;
be744175 154 }
96b5179d
CM
155 ret = get_state_private(block_group_cache, start, &ptr);
156 if (ret)
157 return NULL;
158
ae2f5411 159 block_group = (struct btrfs_block_group_cache *)(unsigned long)ptr;
5cf66426 160 if (block_group->key.objectid <= bytenr && bytenr <
96b5179d
CM
161 block_group->key.objectid + block_group->key.offset)
162 return block_group;
be744175
CM
163 return NULL;
164}
e37c9e69
CM
165static u64 find_search_start(struct btrfs_root *root,
166 struct btrfs_block_group_cache **cache_ret,
5e5745dc
Y
167 u64 search_start, int num,
168 int data, int full_scan)
e37c9e69 169{
e37c9e69
CM
170 int ret;
171 struct btrfs_block_group_cache *cache = *cache_ret;
e19caa5f 172 u64 last;
f510cfec
CM
173 u64 start = 0;
174 u64 end = 0;
257d0ce3 175 u64 cache_miss = 0;
f84a8b36 176 int wrapped = 0;
e37c9e69 177
00f5c795 178 if (!cache) {
1a2b2ac7 179 goto out;
00f5c795 180 }
e37c9e69 181again:
54aa1f4d
CM
182 ret = cache_block_group(root, cache);
183 if (ret)
184 goto out;
f84a8b36 185
e19caa5f
CM
186 last = max(search_start, cache->key.objectid);
187
e37c9e69 188 while(1) {
f510cfec
CM
189 ret = find_first_extent_bit(&root->fs_info->free_space_cache,
190 last, &start, &end, EXTENT_DIRTY);
e19caa5f 191 if (ret) {
257d0ce3
CM
192 if (!cache_miss)
193 cache_miss = last;
e19caa5f
CM
194 goto new_group;
195 }
f510cfec
CM
196
197 start = max(last, start);
198 last = end + 1;
257d0ce3
CM
199 if (last - start < num) {
200 if (last == cache->key.objectid + cache->key.offset)
201 cache_miss = start;
f510cfec 202 continue;
257d0ce3
CM
203 }
204 if (data != BTRFS_BLOCK_GROUP_MIXED &&
5cf66426 205 start + num > cache->key.objectid + cache->key.offset)
e37c9e69 206 goto new_group;
f510cfec 207 return start;
e37c9e69
CM
208 }
209out:
1a2b2ac7
CM
210 cache = btrfs_lookup_block_group(root->fs_info, search_start);
211 if (!cache) {
212 printk("Unable to find block group for %Lu\n",
213 search_start);
214 WARN_ON(1);
215 return search_start;
216 }
1a5bc167 217 return search_start;
e37c9e69
CM
218
219new_group:
e19caa5f 220 last = cache->key.objectid + cache->key.offset;
f84a8b36 221wrapped:
e19caa5f 222 cache = btrfs_lookup_block_group(root->fs_info, last);
e37c9e69 223 if (!cache) {
0e4de584 224no_cache:
f84a8b36
CM
225 if (!wrapped) {
226 wrapped = 1;
227 last = search_start;
228 data = BTRFS_BLOCK_GROUP_MIXED;
229 goto wrapped;
230 }
1a2b2ac7 231 goto out;
e37c9e69 232 }
257d0ce3
CM
233 if (cache_miss && !cache->cached) {
234 cache_block_group(root, cache);
235 last = cache_miss;
257d0ce3
CM
236 cache = btrfs_lookup_block_group(root->fs_info, last);
237 }
1a2b2ac7 238 cache = btrfs_find_block_group(root, cache, last, data, 0);
0e4de584
CM
239 if (!cache)
240 goto no_cache;
e37c9e69 241 *cache_ret = cache;
257d0ce3 242 cache_miss = 0;
e37c9e69
CM
243 goto again;
244}
245
84f54cfa
CM
246static u64 div_factor(u64 num, int factor)
247{
257d0ce3
CM
248 if (factor == 10)
249 return num;
84f54cfa
CM
250 num *= factor;
251 do_div(num, 10);
252 return num;
253}
254
31f3c99b
CM
255struct btrfs_block_group_cache *btrfs_find_block_group(struct btrfs_root *root,
256 struct btrfs_block_group_cache
be744175 257 *hint, u64 search_start,
de428b63 258 int data, int owner)
cd1bc465 259{
96b5179d
CM
260 struct btrfs_block_group_cache *cache;
261 struct extent_map_tree *block_group_cache;
31f3c99b 262 struct btrfs_block_group_cache *found_group = NULL;
cd1bc465
CM
263 struct btrfs_fs_info *info = root->fs_info;
264 u64 used;
31f3c99b
CM
265 u64 last = 0;
266 u64 hint_last;
96b5179d
CM
267 u64 start;
268 u64 end;
269 u64 free_check;
270 u64 ptr;
271 int bit;
cd1bc465 272 int ret;
31f3c99b 273 int full_search = 0;
de428b63 274 int factor = 8;
1e2677e0 275 int data_swap = 0;
de428b63 276
96b5179d
CM
277 block_group_cache = &info->block_group_cache;
278
de428b63 279 if (!owner)
f84a8b36 280 factor = 8;
be744175 281
257d0ce3 282 if (data == BTRFS_BLOCK_GROUP_MIXED) {
f84a8b36 283 bit = BLOCK_GROUP_DATA | BLOCK_GROUP_METADATA;
257d0ce3
CM
284 factor = 10;
285 } else if (data)
96b5179d
CM
286 bit = BLOCK_GROUP_DATA;
287 else
288 bit = BLOCK_GROUP_METADATA;
be744175
CM
289
290 if (search_start) {
291 struct btrfs_block_group_cache *shint;
5276aeda 292 shint = btrfs_lookup_block_group(info, search_start);
f84a8b36
CM
293 if (shint && (shint->data == data ||
294 shint->data == BTRFS_BLOCK_GROUP_MIXED)) {
be744175 295 used = btrfs_block_group_used(&shint->item);
324ae4df
Y
296 if (used + shint->pinned <
297 div_factor(shint->key.offset, factor)) {
be744175
CM
298 return shint;
299 }
300 }
301 }
f84a8b36
CM
302 if (hint && (hint->data == data ||
303 hint->data == BTRFS_BLOCK_GROUP_MIXED)) {
31f3c99b 304 used = btrfs_block_group_used(&hint->item);
324ae4df
Y
305 if (used + hint->pinned <
306 div_factor(hint->key.offset, factor)) {
31f3c99b
CM
307 return hint;
308 }
e19caa5f 309 last = hint->key.objectid + hint->key.offset;
31f3c99b
CM
310 hint_last = last;
311 } else {
e37c9e69
CM
312 if (hint)
313 hint_last = max(hint->key.objectid, search_start);
314 else
315 hint_last = search_start;
316
317 last = hint_last;
31f3c99b 318 }
31f3c99b 319again:
cd1bc465 320 while(1) {
96b5179d
CM
321 ret = find_first_extent_bit(block_group_cache, last,
322 &start, &end, bit);
323 if (ret)
cd1bc465 324 break;
96b5179d
CM
325
326 ret = get_state_private(block_group_cache, start, &ptr);
327 if (ret)
328 break;
329
ae2f5411 330 cache = (struct btrfs_block_group_cache *)(unsigned long)ptr;
96b5179d
CM
331 last = cache->key.objectid + cache->key.offset;
332 used = btrfs_block_group_used(&cache->item);
333
334 if (full_search)
335 free_check = cache->key.offset;
336 else
337 free_check = div_factor(cache->key.offset, factor);
324ae4df 338 if (used + cache->pinned < free_check) {
96b5179d
CM
339 found_group = cache;
340 goto found;
cd1bc465 341 }
de428b63 342 cond_resched();
cd1bc465 343 }
31f3c99b 344 if (!full_search) {
be744175 345 last = search_start;
31f3c99b
CM
346 full_search = 1;
347 goto again;
348 }
1e2677e0 349 if (!data_swap) {
1e2677e0 350 data_swap = 1;
96b5179d 351 bit = BLOCK_GROUP_DATA | BLOCK_GROUP_METADATA;
1e2677e0
CM
352 last = search_start;
353 goto again;
354 }
be744175 355found:
31f3c99b 356 return found_group;
cd1bc465
CM
357}
358
7bb86316 359static u64 hash_extent_ref(u64 root_objectid, u64 ref_generation,
74493f7a
CM
360 u64 owner, u64 owner_offset)
361{
362 u32 high_crc = ~(u32)0;
363 u32 low_crc = ~(u32)0;
364 __le64 lenum;
365
366 lenum = cpu_to_le64(root_objectid);
367 high_crc = crc32c(high_crc, &lenum, sizeof(lenum));
7bb86316
CM
368 lenum = cpu_to_le64(ref_generation);
369 low_crc = crc32c(low_crc, &lenum, sizeof(lenum));
74493f7a 370
7bb86316 371#if 0
74493f7a
CM
372 lenum = cpu_to_le64(owner);
373 low_crc = crc32c(low_crc, &lenum, sizeof(lenum));
74493f7a
CM
374 lenum = cpu_to_le64(owner_offset);
375 low_crc = crc32c(low_crc, &lenum, sizeof(lenum));
7bb86316 376#endif
74493f7a
CM
377 return ((u64)high_crc << 32) | (u64)low_crc;
378}
379
7bb86316
CM
380static int match_extent_ref(struct extent_buffer *leaf,
381 struct btrfs_extent_ref *disk_ref,
382 struct btrfs_extent_ref *cpu_ref)
383{
384 int ret;
385 int len;
386
387 if (cpu_ref->objectid)
388 len = sizeof(*cpu_ref);
389 else
390 len = 2 * sizeof(u64);
391 ret = memcmp_extent_buffer(leaf, cpu_ref, (unsigned long)disk_ref,
392 len);
393 return ret == 0;
394}
395
396static int lookup_extent_backref(struct btrfs_trans_handle *trans,
397 struct btrfs_root *root,
398 struct btrfs_path *path, u64 bytenr,
399 u64 root_objectid, u64 ref_generation,
400 u64 owner, u64 owner_offset, int del)
74493f7a
CM
401{
402 u64 hash;
403 struct btrfs_key key;
7bb86316 404 struct btrfs_key found_key;
74493f7a 405 struct btrfs_extent_ref ref;
7bb86316
CM
406 struct extent_buffer *leaf;
407 struct btrfs_extent_ref *disk_ref;
408 int ret;
409 int ret2;
410
411 btrfs_set_stack_ref_root(&ref, root_objectid);
412 btrfs_set_stack_ref_generation(&ref, ref_generation);
413 btrfs_set_stack_ref_objectid(&ref, owner);
414 btrfs_set_stack_ref_offset(&ref, owner_offset);
415
416 hash = hash_extent_ref(root_objectid, ref_generation, owner,
417 owner_offset);
418 key.offset = hash;
419 key.objectid = bytenr;
420 key.type = BTRFS_EXTENT_REF_KEY;
421
422 while (1) {
423 ret = btrfs_search_slot(trans, root, &key, path,
424 del ? -1 : 0, del);
425 if (ret < 0)
426 goto out;
427 leaf = path->nodes[0];
428 if (ret != 0) {
429 u32 nritems = btrfs_header_nritems(leaf);
430 if (path->slots[0] >= nritems) {
431 ret2 = btrfs_next_leaf(root, path);
432 if (ret2)
433 goto out;
434 leaf = path->nodes[0];
435 }
436 btrfs_item_key_to_cpu(leaf, &found_key, path->slots[0]);
437 if (found_key.objectid != bytenr ||
438 found_key.type != BTRFS_EXTENT_REF_KEY)
439 goto out;
440 key.offset = found_key.offset;
441 if (del) {
442 btrfs_release_path(root, path);
443 continue;
444 }
445 }
446 disk_ref = btrfs_item_ptr(path->nodes[0],
447 path->slots[0],
448 struct btrfs_extent_ref);
449 if (match_extent_ref(path->nodes[0], disk_ref, &ref)) {
450 ret = 0;
451 goto out;
452 }
453 btrfs_item_key_to_cpu(leaf, &found_key, path->slots[0]);
454 key.offset = found_key.offset + 1;
455 btrfs_release_path(root, path);
456 }
457out:
458 return ret;
459}
460
d8d5f3e1
CM
461/*
462 * Back reference rules. Back refs have three main goals:
463 *
464 * 1) differentiate between all holders of references to an extent so that
465 * when a reference is dropped we can make sure it was a valid reference
466 * before freeing the extent.
467 *
468 * 2) Provide enough information to quickly find the holders of an extent
469 * if we notice a given block is corrupted or bad.
470 *
471 * 3) Make it easy to migrate blocks for FS shrinking or storage pool
472 * maintenance. This is actually the same as #2, but with a slightly
473 * different use case.
474 *
475 * File extents can be referenced by:
476 *
477 * - multiple snapshots, subvolumes, or different generations in one subvol
478 * - different files inside a single subvolume (in theory, not implemented yet)
479 * - different offsets inside a file (bookend extents in file.c)
480 *
481 * The extent ref structure has fields for:
482 *
483 * - Objectid of the subvolume root
484 * - Generation number of the tree holding the reference
485 * - objectid of the file holding the reference
486 * - offset in the file corresponding to the key holding the reference
487 *
488 * When a file extent is allocated the fields are filled in:
489 * (root_key.objectid, trans->transid, inode objectid, offset in file)
490 *
491 * When a leaf is cow'd new references are added for every file extent found
492 * in the leaf. It looks the same as the create case, but trans->transid
493 * will be different when the block is cow'd.
494 *
495 * (root_key.objectid, trans->transid, inode objectid, offset in file)
496 *
497 * When a file extent is removed either during snapshot deletion or file
498 * truncation, the corresponding back reference is found
499 * by searching for:
500 *
501 * (btrfs_header_owner(leaf), btrfs_header_generation(leaf),
502 * inode objectid, offset in file)
503 *
504 * Btree extents can be referenced by:
505 *
506 * - Different subvolumes
507 * - Different generations of the same subvolume
508 *
509 * Storing sufficient information for a full reverse mapping of a btree
510 * block would require storing the lowest key of the block in the backref,
511 * and it would require updating that lowest key either before write out or
512 * every time it changed. Instead, the objectid of the lowest key is stored
513 * along with the level of the tree block. This provides a hint
514 * about where in the btree the block can be found. Searches through the
515 * btree only need to look for a pointer to that block, so they stop one
516 * level higher than the level recorded in the backref.
517 *
518 * Some btrees do not do reference counting on their extents. These
519 * include the extent tree and the tree of tree roots. Backrefs for these
520 * trees always have a generation of zero.
521 *
522 * When a tree block is created, back references are inserted:
523 *
f6dbff55 524 * (root->root_key.objectid, trans->transid or zero, level, lowest_key_objectid)
d8d5f3e1
CM
525 *
526 * When a tree block is cow'd in a reference counted root,
527 * new back references are added for all the blocks it points to.
528 * These are of the form (trans->transid will have increased since creation):
529 *
f6dbff55 530 * (root->root_key.objectid, trans->transid, level, lowest_key_objectid)
d8d5f3e1
CM
531 *
532 * Because the lowest_key_objectid and the level are just hints
533 * they are not used when backrefs are deleted. When a backref is deleted:
534 *
535 * if backref was for a tree root:
536 * root_objectid = root->root_key.objectid
537 * else
538 * root_objectid = btrfs_header_owner(parent)
539 *
540 * (root_objectid, btrfs_header_generation(parent) or zero, 0, 0)
541 *
542 * Back Reference Key hashing:
543 *
544 * Back references have four fields, each 64 bits long. Unfortunately,
545 * this is hashed into a single 64 bit number and placed into the key offset.
546 * The key objectid corresponds to the first byte in the extent, and the
547 * key type is set to BTRFS_EXTENT_REF_KEY
548 */
7bb86316
CM
549int btrfs_insert_extent_backref(struct btrfs_trans_handle *trans,
550 struct btrfs_root *root,
551 struct btrfs_path *path, u64 bytenr,
552 u64 root_objectid, u64 ref_generation,
553 u64 owner, u64 owner_offset)
554{
555 u64 hash;
556 struct btrfs_key key;
557 struct btrfs_extent_ref ref;
558 struct btrfs_extent_ref *disk_ref;
74493f7a
CM
559 int ret;
560
561 btrfs_set_stack_ref_root(&ref, root_objectid);
7bb86316 562 btrfs_set_stack_ref_generation(&ref, ref_generation);
74493f7a
CM
563 btrfs_set_stack_ref_objectid(&ref, owner);
564 btrfs_set_stack_ref_offset(&ref, owner_offset);
565
7bb86316
CM
566 hash = hash_extent_ref(root_objectid, ref_generation, owner,
567 owner_offset);
74493f7a
CM
568 key.offset = hash;
569 key.objectid = bytenr;
570 key.type = BTRFS_EXTENT_REF_KEY;
571
572 ret = btrfs_insert_empty_item(trans, root, path, &key, sizeof(ref));
573 while (ret == -EEXIST) {
7bb86316
CM
574 disk_ref = btrfs_item_ptr(path->nodes[0], path->slots[0],
575 struct btrfs_extent_ref);
576 if (match_extent_ref(path->nodes[0], disk_ref, &ref))
577 goto out;
578 key.offset++;
579 btrfs_release_path(root, path);
580 ret = btrfs_insert_empty_item(trans, root, path, &key,
581 sizeof(ref));
74493f7a 582 }
7bb86316
CM
583 if (ret)
584 goto out;
585 disk_ref = btrfs_item_ptr(path->nodes[0], path->slots[0],
586 struct btrfs_extent_ref);
587 write_extent_buffer(path->nodes[0], &ref, (unsigned long)disk_ref,
588 sizeof(ref));
589 btrfs_mark_buffer_dirty(path->nodes[0]);
590out:
591 btrfs_release_path(root, path);
592 return ret;
74493f7a
CM
593}
594
b18c6685
CM
595int btrfs_inc_extent_ref(struct btrfs_trans_handle *trans,
596 struct btrfs_root *root,
74493f7a 597 u64 bytenr, u64 num_bytes,
7bb86316 598 u64 root_objectid, u64 ref_generation,
74493f7a 599 u64 owner, u64 owner_offset)
02217ed2 600{
5caf2a00 601 struct btrfs_path *path;
02217ed2 602 int ret;
e2fa7227 603 struct btrfs_key key;
5f39d397 604 struct extent_buffer *l;
234b63a0 605 struct btrfs_extent_item *item;
cf27e1ee 606 u32 refs;
037e6390 607
db94535d 608 WARN_ON(num_bytes < root->sectorsize);
5caf2a00 609 path = btrfs_alloc_path();
54aa1f4d
CM
610 if (!path)
611 return -ENOMEM;
26b8003f 612
db94535d 613 key.objectid = bytenr;
62e2749e 614 btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
db94535d 615 key.offset = num_bytes;
5caf2a00 616 ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, path,
9f5fae2f 617 0, 1);
54aa1f4d
CM
618 if (ret < 0)
619 return ret;
a429e513 620 if (ret != 0) {
a28ec197 621 BUG();
a429e513 622 }
02217ed2 623 BUG_ON(ret != 0);
5f39d397 624 l = path->nodes[0];
5caf2a00 625 item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item);
5f39d397
CM
626 refs = btrfs_extent_refs(l, item);
627 btrfs_set_extent_refs(l, item, refs + 1);
5caf2a00 628 btrfs_mark_buffer_dirty(path->nodes[0]);
a28ec197 629
5caf2a00 630 btrfs_release_path(root->fs_info->extent_root, path);
7bb86316
CM
631
632 ret = btrfs_insert_extent_backref(trans, root->fs_info->extent_root,
633 path, bytenr, root_objectid,
634 ref_generation, owner, owner_offset);
635 BUG_ON(ret);
9f5fae2f 636 finish_current_insert(trans, root->fs_info->extent_root);
e20d96d6 637 del_pending_extents(trans, root->fs_info->extent_root);
74493f7a
CM
638
639 btrfs_free_path(path);
02217ed2
CM
640 return 0;
641}
642
e9d0b13b
CM
643int btrfs_extent_post_op(struct btrfs_trans_handle *trans,
644 struct btrfs_root *root)
645{
646 finish_current_insert(trans, root->fs_info->extent_root);
647 del_pending_extents(trans, root->fs_info->extent_root);
648 return 0;
649}
650
b18c6685 651static int lookup_extent_ref(struct btrfs_trans_handle *trans,
db94535d
CM
652 struct btrfs_root *root, u64 bytenr,
653 u64 num_bytes, u32 *refs)
a28ec197 654{
5caf2a00 655 struct btrfs_path *path;
a28ec197 656 int ret;
e2fa7227 657 struct btrfs_key key;
5f39d397 658 struct extent_buffer *l;
234b63a0 659 struct btrfs_extent_item *item;
5caf2a00 660
db94535d 661 WARN_ON(num_bytes < root->sectorsize);
5caf2a00 662 path = btrfs_alloc_path();
db94535d
CM
663 key.objectid = bytenr;
664 key.offset = num_bytes;
62e2749e 665 btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
5caf2a00 666 ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, path,
9f5fae2f 667 0, 0);
54aa1f4d
CM
668 if (ret < 0)
669 goto out;
5f39d397
CM
670 if (ret != 0) {
671 btrfs_print_leaf(root, path->nodes[0]);
db94535d 672 printk("failed to find block number %Lu\n", bytenr);
a28ec197 673 BUG();
5f39d397
CM
674 }
675 l = path->nodes[0];
5caf2a00 676 item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item);
5f39d397 677 *refs = btrfs_extent_refs(l, item);
54aa1f4d 678out:
5caf2a00 679 btrfs_free_path(path);
a28ec197
CM
680 return 0;
681}
682
be20aa9d
CM
683u32 btrfs_count_snapshots_in_path(struct btrfs_root *root,
684 struct btrfs_path *count_path,
685 u64 first_extent)
686{
687 struct btrfs_root *extent_root = root->fs_info->extent_root;
688 struct btrfs_path *path;
689 u64 bytenr;
690 u64 found_objectid;
56b453c9 691 u64 root_objectid = root->root_key.objectid;
be20aa9d
CM
692 u32 total_count = 0;
693 u32 cur_count;
694 u32 refs;
695 u32 nritems;
696 int ret;
697 struct btrfs_key key;
698 struct btrfs_key found_key;
699 struct extent_buffer *l;
700 struct btrfs_extent_item *item;
701 struct btrfs_extent_ref *ref_item;
702 int level = -1;
703
704 path = btrfs_alloc_path();
705again:
706 if (level == -1)
707 bytenr = first_extent;
708 else
709 bytenr = count_path->nodes[level]->start;
710
711 cur_count = 0;
712 key.objectid = bytenr;
713 key.offset = 0;
714
715 btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
716 ret = btrfs_search_slot(NULL, extent_root, &key, path, 0, 0);
717 if (ret < 0)
718 goto out;
719 BUG_ON(ret == 0);
720
721 l = path->nodes[0];
722 btrfs_item_key_to_cpu(l, &found_key, path->slots[0]);
723
724 if (found_key.objectid != bytenr ||
725 found_key.type != BTRFS_EXTENT_ITEM_KEY) {
726 goto out;
727 }
728
729 item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item);
730 refs = btrfs_extent_refs(l, item);
731 while (1) {
732 nritems = btrfs_header_nritems(l);
733 if (path->slots[0] >= nritems) {
734 ret = btrfs_next_leaf(extent_root, path);
735 if (ret == 0)
736 continue;
737 break;
738 }
739 btrfs_item_key_to_cpu(l, &found_key, path->slots[0]);
740 if (found_key.objectid != bytenr)
741 break;
742 if (found_key.type != BTRFS_EXTENT_REF_KEY) {
743 path->slots[0]++;
744 continue;
745 }
746
747 cur_count++;
748 ref_item = btrfs_item_ptr(l, path->slots[0],
749 struct btrfs_extent_ref);
750 found_objectid = btrfs_ref_root(l, ref_item);
751
56b453c9
CM
752 if (found_objectid != root_objectid) {
753 total_count = 2;
4313b399 754 goto out;
56b453c9
CM
755 }
756 total_count = 1;
be20aa9d
CM
757 path->slots[0]++;
758 }
759 if (cur_count == 0) {
760 total_count = 0;
761 goto out;
762 }
be20aa9d
CM
763 if (level >= 0 && root->node == count_path->nodes[level])
764 goto out;
765 level++;
766 btrfs_release_path(root, path);
767 goto again;
768
769out:
770 btrfs_free_path(path);
771 return total_count;
772
773}
774
c5739bba 775int btrfs_inc_root_ref(struct btrfs_trans_handle *trans,
7bb86316 776 struct btrfs_root *root, u64 owner_objectid)
c5739bba 777{
7bb86316
CM
778 u64 generation;
779 u64 key_objectid;
780 u64 level;
781 u32 nritems;
782 struct btrfs_disk_key disk_key;
783
784 level = btrfs_header_level(root->node);
785 generation = trans->transid;
786 nritems = btrfs_header_nritems(root->node);
787 if (nritems > 0) {
788 if (level == 0)
789 btrfs_item_key(root->node, &disk_key, 0);
790 else
791 btrfs_node_key(root->node, &disk_key, 0);
792 key_objectid = btrfs_disk_key_objectid(&disk_key);
793 } else {
794 key_objectid = 0;
795 }
db94535d 796 return btrfs_inc_extent_ref(trans, root, root->node->start,
7bb86316 797 root->node->len, owner_objectid,
f6dbff55 798 generation, level, key_objectid);
c5739bba
CM
799}
800
e089f05c 801int btrfs_inc_ref(struct btrfs_trans_handle *trans, struct btrfs_root *root,
5f39d397 802 struct extent_buffer *buf)
02217ed2 803{
db94535d 804 u64 bytenr;
5f39d397
CM
805 u32 nritems;
806 struct btrfs_key key;
6407bf6d 807 struct btrfs_file_extent_item *fi;
02217ed2 808 int i;
db94535d 809 int level;
6407bf6d 810 int ret;
54aa1f4d 811 int faili;
a28ec197 812
3768f368 813 if (!root->ref_cows)
a28ec197 814 return 0;
5f39d397 815
db94535d 816 level = btrfs_header_level(buf);
5f39d397
CM
817 nritems = btrfs_header_nritems(buf);
818 for (i = 0; i < nritems; i++) {
db94535d
CM
819 if (level == 0) {
820 u64 disk_bytenr;
5f39d397
CM
821 btrfs_item_key_to_cpu(buf, &key, i);
822 if (btrfs_key_type(&key) != BTRFS_EXTENT_DATA_KEY)
6407bf6d 823 continue;
5f39d397 824 fi = btrfs_item_ptr(buf, i,
6407bf6d 825 struct btrfs_file_extent_item);
5f39d397 826 if (btrfs_file_extent_type(buf, fi) ==
236454df
CM
827 BTRFS_FILE_EXTENT_INLINE)
828 continue;
db94535d
CM
829 disk_bytenr = btrfs_file_extent_disk_bytenr(buf, fi);
830 if (disk_bytenr == 0)
3a686375 831 continue;
db94535d 832 ret = btrfs_inc_extent_ref(trans, root, disk_bytenr,
7bb86316
CM
833 btrfs_file_extent_disk_num_bytes(buf, fi),
834 root->root_key.objectid, trans->transid,
835 key.objectid, key.offset);
54aa1f4d
CM
836 if (ret) {
837 faili = i;
838 goto fail;
839 }
6407bf6d 840 } else {
db94535d 841 bytenr = btrfs_node_blockptr(buf, i);
6caab489 842 btrfs_node_key_to_cpu(buf, &key, i);
db94535d 843 ret = btrfs_inc_extent_ref(trans, root, bytenr,
7bb86316
CM
844 btrfs_level_size(root, level - 1),
845 root->root_key.objectid,
f6dbff55
CM
846 trans->transid,
847 level - 1, key.objectid);
54aa1f4d
CM
848 if (ret) {
849 faili = i;
850 goto fail;
851 }
6407bf6d 852 }
02217ed2
CM
853 }
854 return 0;
54aa1f4d 855fail:
ccd467d6 856 WARN_ON(1);
7bb86316 857#if 0
54aa1f4d 858 for (i =0; i < faili; i++) {
db94535d
CM
859 if (level == 0) {
860 u64 disk_bytenr;
5f39d397
CM
861 btrfs_item_key_to_cpu(buf, &key, i);
862 if (btrfs_key_type(&key) != BTRFS_EXTENT_DATA_KEY)
54aa1f4d 863 continue;
5f39d397 864 fi = btrfs_item_ptr(buf, i,
54aa1f4d 865 struct btrfs_file_extent_item);
5f39d397 866 if (btrfs_file_extent_type(buf, fi) ==
54aa1f4d
CM
867 BTRFS_FILE_EXTENT_INLINE)
868 continue;
db94535d
CM
869 disk_bytenr = btrfs_file_extent_disk_bytenr(buf, fi);
870 if (disk_bytenr == 0)
54aa1f4d 871 continue;
db94535d
CM
872 err = btrfs_free_extent(trans, root, disk_bytenr,
873 btrfs_file_extent_disk_num_bytes(buf,
5f39d397 874 fi), 0);
54aa1f4d
CM
875 BUG_ON(err);
876 } else {
db94535d
CM
877 bytenr = btrfs_node_blockptr(buf, i);
878 err = btrfs_free_extent(trans, root, bytenr,
879 btrfs_level_size(root, level - 1), 0);
54aa1f4d
CM
880 BUG_ON(err);
881 }
882 }
7bb86316 883#endif
54aa1f4d 884 return ret;
02217ed2
CM
885}
886
9078a3e1
CM
887static int write_one_cache_group(struct btrfs_trans_handle *trans,
888 struct btrfs_root *root,
889 struct btrfs_path *path,
890 struct btrfs_block_group_cache *cache)
891{
892 int ret;
893 int pending_ret;
894 struct btrfs_root *extent_root = root->fs_info->extent_root;
5f39d397
CM
895 unsigned long bi;
896 struct extent_buffer *leaf;
9078a3e1 897
9078a3e1 898 ret = btrfs_search_slot(trans, extent_root, &cache->key, path, 0, 1);
54aa1f4d
CM
899 if (ret < 0)
900 goto fail;
9078a3e1 901 BUG_ON(ret);
5f39d397
CM
902
903 leaf = path->nodes[0];
904 bi = btrfs_item_ptr_offset(leaf, path->slots[0]);
905 write_extent_buffer(leaf, &cache->item, bi, sizeof(cache->item));
906 btrfs_mark_buffer_dirty(leaf);
9078a3e1 907 btrfs_release_path(extent_root, path);
54aa1f4d 908fail:
9078a3e1
CM
909 finish_current_insert(trans, extent_root);
910 pending_ret = del_pending_extents(trans, extent_root);
911 if (ret)
912 return ret;
913 if (pending_ret)
914 return pending_ret;
915 return 0;
916
917}
918
96b5179d
CM
919int btrfs_write_dirty_block_groups(struct btrfs_trans_handle *trans,
920 struct btrfs_root *root)
9078a3e1 921{
96b5179d
CM
922 struct extent_map_tree *block_group_cache;
923 struct btrfs_block_group_cache *cache;
9078a3e1
CM
924 int ret;
925 int err = 0;
926 int werr = 0;
9078a3e1 927 struct btrfs_path *path;
96b5179d
CM
928 u64 last = 0;
929 u64 start;
930 u64 end;
931 u64 ptr;
9078a3e1 932
96b5179d 933 block_group_cache = &root->fs_info->block_group_cache;
9078a3e1
CM
934 path = btrfs_alloc_path();
935 if (!path)
936 return -ENOMEM;
937
938 while(1) {
96b5179d
CM
939 ret = find_first_extent_bit(block_group_cache, last,
940 &start, &end, BLOCK_GROUP_DIRTY);
941 if (ret)
9078a3e1 942 break;
54aa1f4d 943
96b5179d
CM
944 last = end + 1;
945 ret = get_state_private(block_group_cache, start, &ptr);
946 if (ret)
947 break;
948
ae2f5411 949 cache = (struct btrfs_block_group_cache *)(unsigned long)ptr;
96b5179d
CM
950 err = write_one_cache_group(trans, root,
951 path, cache);
952 /*
953 * if we fail to write the cache group, we want
954 * to keep it marked dirty in hopes that a later
955 * write will work
956 */
957 if (err) {
958 werr = err;
959 continue;
9078a3e1 960 }
96b5179d
CM
961 clear_extent_bits(block_group_cache, start, end,
962 BLOCK_GROUP_DIRTY, GFP_NOFS);
9078a3e1
CM
963 }
964 btrfs_free_path(path);
965 return werr;
966}
967
968static int update_block_group(struct btrfs_trans_handle *trans,
969 struct btrfs_root *root,
db94535d
CM
970 u64 bytenr, u64 num_bytes, int alloc,
971 int mark_free, int data)
9078a3e1
CM
972{
973 struct btrfs_block_group_cache *cache;
974 struct btrfs_fs_info *info = root->fs_info;
db94535d 975 u64 total = num_bytes;
9078a3e1 976 u64 old_val;
db94535d 977 u64 byte_in_group;
96b5179d
CM
978 u64 start;
979 u64 end;
3e1ad54f 980
9078a3e1 981 while(total) {
db94535d 982 cache = btrfs_lookup_block_group(info, bytenr);
3e1ad54f 983 if (!cache) {
9078a3e1 984 return -1;
cd1bc465 985 }
db94535d
CM
986 byte_in_group = bytenr - cache->key.objectid;
987 WARN_ON(byte_in_group > cache->key.offset);
96b5179d
CM
988 start = cache->key.objectid;
989 end = start + cache->key.offset - 1;
990 set_extent_bits(&info->block_group_cache, start, end,
991 BLOCK_GROUP_DIRTY, GFP_NOFS);
9078a3e1
CM
992
993 old_val = btrfs_block_group_used(&cache->item);
db94535d 994 num_bytes = min(total, cache->key.offset - byte_in_group);
cd1bc465 995 if (alloc) {
1e2677e0 996 if (cache->data != data &&
84f54cfa 997 old_val < (cache->key.offset >> 1)) {
96b5179d
CM
998 int bit_to_clear;
999 int bit_to_set;
96b5179d 1000 cache->data = data;
1e2677e0 1001 if (data) {
b97f9203
Y
1002 bit_to_clear = BLOCK_GROUP_METADATA;
1003 bit_to_set = BLOCK_GROUP_DATA;
f84a8b36
CM
1004 cache->item.flags &=
1005 ~BTRFS_BLOCK_GROUP_MIXED;
1e2677e0
CM
1006 cache->item.flags |=
1007 BTRFS_BLOCK_GROUP_DATA;
1008 } else {
b97f9203
Y
1009 bit_to_clear = BLOCK_GROUP_DATA;
1010 bit_to_set = BLOCK_GROUP_METADATA;
f84a8b36
CM
1011 cache->item.flags &=
1012 ~BTRFS_BLOCK_GROUP_MIXED;
1e2677e0
CM
1013 cache->item.flags &=
1014 ~BTRFS_BLOCK_GROUP_DATA;
1015 }
96b5179d
CM
1016 clear_extent_bits(&info->block_group_cache,
1017 start, end, bit_to_clear,
1018 GFP_NOFS);
1019 set_extent_bits(&info->block_group_cache,
1020 start, end, bit_to_set,
1021 GFP_NOFS);
f84a8b36
CM
1022 } else if (cache->data != data &&
1023 cache->data != BTRFS_BLOCK_GROUP_MIXED) {
1024 cache->data = BTRFS_BLOCK_GROUP_MIXED;
1025 set_extent_bits(&info->block_group_cache,
1026 start, end,
1027 BLOCK_GROUP_DATA |
1028 BLOCK_GROUP_METADATA,
1029 GFP_NOFS);
1e2677e0 1030 }
db94535d 1031 old_val += num_bytes;
cd1bc465 1032 } else {
db94535d 1033 old_val -= num_bytes;
f510cfec
CM
1034 if (mark_free) {
1035 set_extent_dirty(&info->free_space_cache,
db94535d 1036 bytenr, bytenr + num_bytes - 1,
f510cfec 1037 GFP_NOFS);
e37c9e69 1038 }
cd1bc465 1039 }
9078a3e1 1040 btrfs_set_block_group_used(&cache->item, old_val);
db94535d
CM
1041 total -= num_bytes;
1042 bytenr += num_bytes;
9078a3e1
CM
1043 }
1044 return 0;
1045}
324ae4df
Y
1046static int update_pinned_extents(struct btrfs_root *root,
1047 u64 bytenr, u64 num, int pin)
1048{
1049 u64 len;
1050 struct btrfs_block_group_cache *cache;
1051 struct btrfs_fs_info *fs_info = root->fs_info;
1052
1053 if (pin) {
1054 set_extent_dirty(&fs_info->pinned_extents,
1055 bytenr, bytenr + num - 1, GFP_NOFS);
1056 } else {
1057 clear_extent_dirty(&fs_info->pinned_extents,
1058 bytenr, bytenr + num - 1, GFP_NOFS);
1059 }
1060 while (num > 0) {
1061 cache = btrfs_lookup_block_group(fs_info, bytenr);
1062 WARN_ON(!cache);
1063 len = min(num, cache->key.offset -
1064 (bytenr - cache->key.objectid));
1065 if (pin) {
1066 cache->pinned += len;
1067 fs_info->total_pinned += len;
1068 } else {
1069 cache->pinned -= len;
1070 fs_info->total_pinned -= len;
1071 }
1072 bytenr += len;
1073 num -= len;
1074 }
1075 return 0;
1076}
9078a3e1 1077
1a5bc167 1078int btrfs_copy_pinned(struct btrfs_root *root, struct extent_map_tree *copy)
ccd467d6 1079{
ccd467d6 1080 u64 last = 0;
1a5bc167
CM
1081 u64 start;
1082 u64 end;
1083 struct extent_map_tree *pinned_extents = &root->fs_info->pinned_extents;
ccd467d6 1084 int ret;
ccd467d6
CM
1085
1086 while(1) {
1a5bc167
CM
1087 ret = find_first_extent_bit(pinned_extents, last,
1088 &start, &end, EXTENT_DIRTY);
1089 if (ret)
ccd467d6 1090 break;
1a5bc167
CM
1091 set_extent_dirty(copy, start, end, GFP_NOFS);
1092 last = end + 1;
ccd467d6
CM
1093 }
1094 return 0;
1095}
1096
1097int btrfs_finish_extent_commit(struct btrfs_trans_handle *trans,
1098 struct btrfs_root *root,
1a5bc167 1099 struct extent_map_tree *unpin)
a28ec197 1100{
1a5bc167
CM
1101 u64 start;
1102 u64 end;
a28ec197 1103 int ret;
f510cfec 1104 struct extent_map_tree *free_space_cache;
f510cfec 1105 free_space_cache = &root->fs_info->free_space_cache;
a28ec197
CM
1106
1107 while(1) {
1a5bc167
CM
1108 ret = find_first_extent_bit(unpin, 0, &start, &end,
1109 EXTENT_DIRTY);
1110 if (ret)
a28ec197 1111 break;
324ae4df 1112 update_pinned_extents(root, start, end + 1 - start, 0);
1a5bc167
CM
1113 clear_extent_dirty(unpin, start, end, GFP_NOFS);
1114 set_extent_dirty(free_space_cache, start, end, GFP_NOFS);
a28ec197
CM
1115 }
1116 return 0;
1117}
1118
e089f05c
CM
1119static int finish_current_insert(struct btrfs_trans_handle *trans, struct
1120 btrfs_root *extent_root)
037e6390 1121{
7bb86316
CM
1122 u64 start;
1123 u64 end;
1124 struct btrfs_fs_info *info = extent_root->fs_info;
d8d5f3e1 1125 struct extent_buffer *eb;
7bb86316 1126 struct btrfs_path *path;
e2fa7227 1127 struct btrfs_key ins;
d8d5f3e1 1128 struct btrfs_disk_key first;
234b63a0 1129 struct btrfs_extent_item extent_item;
037e6390 1130 int ret;
d8d5f3e1 1131 int level;
1a5bc167 1132 int err = 0;
037e6390 1133
5f39d397 1134 btrfs_set_stack_extent_refs(&extent_item, 1);
62e2749e 1135 btrfs_set_key_type(&ins, BTRFS_EXTENT_ITEM_KEY);
7bb86316 1136 path = btrfs_alloc_path();
037e6390 1137
26b8003f 1138 while(1) {
1a5bc167
CM
1139 ret = find_first_extent_bit(&info->extent_ins, 0, &start,
1140 &end, EXTENT_LOCKED);
1141 if (ret)
26b8003f
CM
1142 break;
1143
1a5bc167
CM
1144 ins.objectid = start;
1145 ins.offset = end + 1 - start;
1146 err = btrfs_insert_item(trans, extent_root, &ins,
1147 &extent_item, sizeof(extent_item));
1148 clear_extent_bits(&info->extent_ins, start, end, EXTENT_LOCKED,
1149 GFP_NOFS);
d8d5f3e1
CM
1150 eb = read_tree_block(extent_root, ins.objectid, ins.offset);
1151 level = btrfs_header_level(eb);
1152 if (level == 0) {
1153 btrfs_item_key(eb, &first, 0);
1154 } else {
1155 btrfs_node_key(eb, &first, 0);
1156 }
7bb86316
CM
1157 err = btrfs_insert_extent_backref(trans, extent_root, path,
1158 start, extent_root->root_key.objectid,
f6dbff55
CM
1159 0, level,
1160 btrfs_disk_key_objectid(&first));
7bb86316 1161 BUG_ON(err);
d8d5f3e1 1162 free_extent_buffer(eb);
037e6390 1163 }
7bb86316 1164 btrfs_free_path(path);
037e6390
CM
1165 return 0;
1166}
1167
db94535d
CM
1168static int pin_down_bytes(struct btrfs_root *root, u64 bytenr, u32 num_bytes,
1169 int pending)
e20d96d6 1170{
1a5bc167 1171 int err = 0;
5f39d397 1172 struct extent_buffer *buf;
8ef97622 1173
f4b9aa8d 1174 if (!pending) {
db94535d 1175 buf = btrfs_find_tree_block(root, bytenr, num_bytes);
5f39d397
CM
1176 if (buf) {
1177 if (btrfs_buffer_uptodate(buf)) {
2c90e5d6
CM
1178 u64 transid =
1179 root->fs_info->running_transaction->transid;
5f39d397
CM
1180 if (btrfs_header_generation(buf) == transid) {
1181 free_extent_buffer(buf);
c549228f 1182 return 1;
2c90e5d6 1183 }
f4b9aa8d 1184 }
5f39d397 1185 free_extent_buffer(buf);
8ef97622 1186 }
324ae4df 1187 update_pinned_extents(root, bytenr, num_bytes, 1);
f4b9aa8d 1188 } else {
1a5bc167 1189 set_extent_bits(&root->fs_info->pending_del,
db94535d
CM
1190 bytenr, bytenr + num_bytes - 1,
1191 EXTENT_LOCKED, GFP_NOFS);
f4b9aa8d 1192 }
be744175 1193 BUG_ON(err < 0);
e20d96d6
CM
1194 return 0;
1195}
1196
fec577fb 1197/*
a28ec197 1198 * remove an extent from the root, returns 0 on success
fec577fb 1199 */
e089f05c 1200static int __free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
7bb86316
CM
1201 *root, u64 bytenr, u64 num_bytes,
1202 u64 root_objectid, u64 ref_generation,
1203 u64 owner_objectid, u64 owner_offset, int pin,
e37c9e69 1204 int mark_free)
a28ec197 1205{
5caf2a00 1206 struct btrfs_path *path;
e2fa7227 1207 struct btrfs_key key;
1261ec42
CM
1208 struct btrfs_fs_info *info = root->fs_info;
1209 struct btrfs_root *extent_root = info->extent_root;
5f39d397 1210 struct extent_buffer *leaf;
a28ec197 1211 int ret;
234b63a0 1212 struct btrfs_extent_item *ei;
cf27e1ee 1213 u32 refs;
037e6390 1214
db94535d 1215 key.objectid = bytenr;
62e2749e 1216 btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
db94535d 1217 key.offset = num_bytes;
a28ec197 1218
5caf2a00 1219 path = btrfs_alloc_path();
54aa1f4d
CM
1220 if (!path)
1221 return -ENOMEM;
5f26f772 1222
7bb86316
CM
1223 ret = lookup_extent_backref(trans, extent_root, path,
1224 bytenr, root_objectid,
1225 ref_generation,
1226 owner_objectid, owner_offset, 1);
1227 if (ret == 0) {
1228 ret = btrfs_del_item(trans, extent_root, path);
1229 } else {
1230 btrfs_print_leaf(extent_root, path->nodes[0]);
1231 WARN_ON(1);
1232 printk("Unable to find ref byte nr %Lu root %Lu "
1233 " gen %Lu owner %Lu offset %Lu\n", bytenr,
1234 root_objectid, ref_generation, owner_objectid,
1235 owner_offset);
1236 }
1237 btrfs_release_path(extent_root, path);
54aa1f4d
CM
1238 ret = btrfs_search_slot(trans, extent_root, &key, path, -1, 1);
1239 if (ret < 0)
1240 return ret;
1241 BUG_ON(ret);
5f39d397
CM
1242
1243 leaf = path->nodes[0];
1244 ei = btrfs_item_ptr(leaf, path->slots[0],
123abc88 1245 struct btrfs_extent_item);
5f39d397
CM
1246 refs = btrfs_extent_refs(leaf, ei);
1247 BUG_ON(refs == 0);
1248 refs -= 1;
1249 btrfs_set_extent_refs(leaf, ei, refs);
1250 btrfs_mark_buffer_dirty(leaf);
1251
cf27e1ee 1252 if (refs == 0) {
db94535d
CM
1253 u64 super_used;
1254 u64 root_used;
78fae27e
CM
1255
1256 if (pin) {
db94535d 1257 ret = pin_down_bytes(root, bytenr, num_bytes, 0);
c549228f
Y
1258 if (ret > 0)
1259 mark_free = 1;
1260 BUG_ON(ret < 0);
78fae27e
CM
1261 }
1262
58176a96 1263 /* block accounting for super block */
db94535d
CM
1264 super_used = btrfs_super_bytes_used(&info->super_copy);
1265 btrfs_set_super_bytes_used(&info->super_copy,
1266 super_used - num_bytes);
58176a96
JB
1267
1268 /* block accounting for root item */
db94535d 1269 root_used = btrfs_root_used(&root->root_item);
5f39d397 1270 btrfs_set_root_used(&root->root_item,
db94535d 1271 root_used - num_bytes);
58176a96 1272
5caf2a00 1273 ret = btrfs_del_item(trans, extent_root, path);
54aa1f4d
CM
1274 if (ret) {
1275 return ret;
1276 }
db94535d 1277 ret = update_block_group(trans, root, bytenr, num_bytes, 0,
1e2677e0 1278 mark_free, 0);
9078a3e1 1279 BUG_ON(ret);
a28ec197 1280 }
5caf2a00 1281 btrfs_free_path(path);
e089f05c 1282 finish_current_insert(trans, extent_root);
a28ec197
CM
1283 return ret;
1284}
1285
a28ec197
CM
1286/*
1287 * find all the blocks marked as pending in the radix tree and remove
1288 * them from the extent map
1289 */
e089f05c
CM
1290static int del_pending_extents(struct btrfs_trans_handle *trans, struct
1291 btrfs_root *extent_root)
a28ec197
CM
1292{
1293 int ret;
e20d96d6 1294 int err = 0;
1a5bc167
CM
1295 u64 start;
1296 u64 end;
1297 struct extent_map_tree *pending_del;
1298 struct extent_map_tree *pinned_extents;
8ef97622 1299
1a5bc167
CM
1300 pending_del = &extent_root->fs_info->pending_del;
1301 pinned_extents = &extent_root->fs_info->pinned_extents;
a28ec197
CM
1302
1303 while(1) {
1a5bc167
CM
1304 ret = find_first_extent_bit(pending_del, 0, &start, &end,
1305 EXTENT_LOCKED);
1306 if (ret)
a28ec197 1307 break;
324ae4df 1308 update_pinned_extents(extent_root, start, end + 1 - start, 1);
1a5bc167
CM
1309 clear_extent_bits(pending_del, start, end, EXTENT_LOCKED,
1310 GFP_NOFS);
1311 ret = __free_extent(trans, extent_root,
7bb86316
CM
1312 start, end + 1 - start,
1313 extent_root->root_key.objectid,
1314 0, 0, 0, 0, 0);
1a5bc167
CM
1315 if (ret)
1316 err = ret;
fec577fb 1317 }
e20d96d6 1318 return err;
fec577fb
CM
1319}
1320
1321/*
1322 * remove an extent from the root, returns 0 on success
1323 */
e089f05c 1324int btrfs_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
7bb86316
CM
1325 *root, u64 bytenr, u64 num_bytes,
1326 u64 root_objectid, u64 ref_generation,
1327 u64 owner_objectid, u64 owner_offset, int pin)
fec577fb 1328{
9f5fae2f 1329 struct btrfs_root *extent_root = root->fs_info->extent_root;
fec577fb
CM
1330 int pending_ret;
1331 int ret;
a28ec197 1332
db94535d 1333 WARN_ON(num_bytes < root->sectorsize);
7bb86316
CM
1334 if (!root->ref_cows)
1335 ref_generation = 0;
1336
fec577fb 1337 if (root == extent_root) {
db94535d 1338 pin_down_bytes(root, bytenr, num_bytes, 1);
fec577fb
CM
1339 return 0;
1340 }
7bb86316
CM
1341 ret = __free_extent(trans, root, bytenr, num_bytes, root_objectid,
1342 ref_generation, owner_objectid, owner_offset,
1343 pin, pin == 0);
e20d96d6 1344 pending_ret = del_pending_extents(trans, root->fs_info->extent_root);
fec577fb
CM
1345 return ret ? ret : pending_ret;
1346}
1347
87ee04eb
CM
1348static u64 stripe_align(struct btrfs_root *root, u64 val)
1349{
1350 u64 mask = ((u64)root->stripesize - 1);
1351 u64 ret = (val + mask) & ~mask;
1352 return ret;
1353}
1354
fec577fb
CM
1355/*
1356 * walks the btree of allocated extents and find a hole of a given size.
1357 * The key ins is changed to record the hole:
1358 * ins->objectid == block start
62e2749e 1359 * ins->flags = BTRFS_EXTENT_ITEM_KEY
fec577fb
CM
1360 * ins->offset == number of blocks
1361 * Any available blocks before search_start are skipped.
1362 */
e089f05c 1363static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
db94535d
CM
1364 *orig_root, u64 num_bytes, u64 empty_size,
1365 u64 search_start, u64 search_end, u64 hint_byte,
f2654de4
CM
1366 struct btrfs_key *ins, u64 exclude_start,
1367 u64 exclude_nr, int data)
fec577fb 1368{
5caf2a00 1369 struct btrfs_path *path;
e2fa7227 1370 struct btrfs_key key;
fec577fb 1371 u64 hole_size = 0;
87ee04eb
CM
1372 u64 aligned;
1373 int ret;
fec577fb 1374 int slot = 0;
db94535d 1375 u64 last_byte = 0;
be744175 1376 u64 orig_search_start = search_start;
fec577fb 1377 int start_found;
5f39d397 1378 struct extent_buffer *l;
9f5fae2f 1379 struct btrfs_root * root = orig_root->fs_info->extent_root;
f2458e1d 1380 struct btrfs_fs_info *info = root->fs_info;
db94535d 1381 u64 total_needed = num_bytes;
e20d96d6 1382 int level;
be08c1b9 1383 struct btrfs_block_group_cache *block_group;
be744175 1384 int full_scan = 0;
fbdc762b 1385 int wrapped = 0;
f84a8b36 1386 u64 cached_start;
fec577fb 1387
db94535d 1388 WARN_ON(num_bytes < root->sectorsize);
b1a4d965
CM
1389 btrfs_set_key_type(ins, BTRFS_EXTENT_ITEM_KEY);
1390
5f39d397
CM
1391 level = btrfs_header_level(root->node);
1392
015a739c 1393 if (num_bytes >= 32 * 1024 * 1024 && hint_byte) {
257d0ce3
CM
1394 data = BTRFS_BLOCK_GROUP_MIXED;
1395 }
1396
3e1ad54f 1397 if (search_end == (u64)-1)
db94535d
CM
1398 search_end = btrfs_super_total_bytes(&info->super_copy);
1399 if (hint_byte) {
1400 block_group = btrfs_lookup_block_group(info, hint_byte);
1a2b2ac7
CM
1401 if (!block_group)
1402 hint_byte = search_start;
be744175 1403 block_group = btrfs_find_block_group(root, block_group,
db94535d 1404 hint_byte, data, 1);
be744175
CM
1405 } else {
1406 block_group = btrfs_find_block_group(root,
1a2b2ac7
CM
1407 trans->block_group,
1408 search_start, data, 1);
be744175
CM
1409 }
1410
6702ed49 1411 total_needed += empty_size;
e011599b 1412 path = btrfs_alloc_path();
be744175 1413check_failed:
70b043f0
CM
1414 if (!block_group) {
1415 block_group = btrfs_lookup_block_group(info, search_start);
1416 if (!block_group)
1417 block_group = btrfs_lookup_block_group(info,
1418 orig_search_start);
1419 }
5e5745dc
Y
1420 search_start = find_search_start(root, &block_group, search_start,
1421 total_needed, data, full_scan);
87ee04eb 1422 search_start = stripe_align(root, search_start);
f84a8b36 1423 cached_start = search_start;
5caf2a00 1424 btrfs_init_path(path);
fec577fb
CM
1425 ins->objectid = search_start;
1426 ins->offset = 0;
fec577fb 1427 start_found = 0;
2cc58cf2 1428 path->reada = 2;
e37c9e69 1429
5caf2a00 1430 ret = btrfs_search_slot(trans, root, ins, path, 0, 0);
0f70abe2
CM
1431 if (ret < 0)
1432 goto error;
aa5d6bed 1433
e37c9e69 1434 if (path->slots[0] > 0) {
5caf2a00 1435 path->slots[0]--;
e37c9e69
CM
1436 }
1437
5f39d397
CM
1438 l = path->nodes[0];
1439 btrfs_item_key_to_cpu(l, &key, path->slots[0]);
1440
e37c9e69 1441 /*
7bb86316 1442 * walk backwards to find the first extent item key
e37c9e69 1443 */
7bb86316
CM
1444 while(btrfs_key_type(&key) != BTRFS_EXTENT_ITEM_KEY) {
1445 if (path->slots[0] == 0) {
1446 ret = btrfs_prev_leaf(root, path);
1447 if (ret != 0) {
1448 ret = btrfs_search_slot(trans, root, ins,
1449 path, 0, 0);
1450 if (ret < 0)
1451 goto error;
1452 if (path->slots[0] > 0)
1453 path->slots[0]--;
1454 break;
1455 }
1456 } else {
e37c9e69
CM
1457 path->slots[0]--;
1458 }
7bb86316
CM
1459 l = path->nodes[0];
1460 btrfs_item_key_to_cpu(l, &key, path->slots[0]);
e37c9e69 1461 }
fec577fb 1462 while (1) {
5f39d397 1463 l = path->nodes[0];
5caf2a00 1464 slot = path->slots[0];
5f39d397 1465 if (slot >= btrfs_header_nritems(l)) {
5caf2a00 1466 ret = btrfs_next_leaf(root, path);
fec577fb
CM
1467 if (ret == 0)
1468 continue;
0f70abe2
CM
1469 if (ret < 0)
1470 goto error;
e19caa5f
CM
1471
1472 search_start = max(search_start,
1473 block_group->key.objectid);
fec577fb 1474 if (!start_found) {
87ee04eb
CM
1475 aligned = stripe_align(root, search_start);
1476 ins->objectid = aligned;
1477 if (aligned >= search_end) {
1478 ret = -ENOSPC;
1479 goto error;
1480 }
1481 ins->offset = search_end - aligned;
fec577fb
CM
1482 start_found = 1;
1483 goto check_pending;
1484 }
87ee04eb
CM
1485 ins->objectid = stripe_align(root,
1486 last_byte > search_start ?
1487 last_byte : search_start);
1488 if (search_end <= ins->objectid) {
1489 ret = -ENOSPC;
1490 goto error;
1491 }
3e1ad54f 1492 ins->offset = search_end - ins->objectid;
e19caa5f 1493 BUG_ON(ins->objectid >= search_end);
fec577fb
CM
1494 goto check_pending;
1495 }
5f39d397 1496 btrfs_item_key_to_cpu(l, &key, slot);
96b5179d 1497
db94535d 1498 if (key.objectid >= search_start && key.objectid > last_byte &&
e37c9e69 1499 start_found) {
db94535d
CM
1500 if (last_byte < search_start)
1501 last_byte = search_start;
87ee04eb
CM
1502 aligned = stripe_align(root, last_byte);
1503 hole_size = key.objectid - aligned;
1504 if (key.objectid > aligned && hole_size >= num_bytes) {
1505 ins->objectid = aligned;
e37c9e69
CM
1506 ins->offset = hole_size;
1507 goto check_pending;
0579da42 1508 }
fec577fb 1509 }
96b5179d 1510 if (btrfs_key_type(&key) != BTRFS_EXTENT_ITEM_KEY) {
7bb86316
CM
1511 if (!start_found && btrfs_key_type(&key) ==
1512 BTRFS_BLOCK_GROUP_ITEM_KEY) {
db94535d 1513 last_byte = key.objectid;
96b5179d
CM
1514 start_found = 1;
1515 }
e37c9e69 1516 goto next;
96b5179d
CM
1517 }
1518
e37c9e69 1519
0579da42 1520 start_found = 1;
db94535d 1521 last_byte = key.objectid + key.offset;
f510cfec 1522
257d0ce3
CM
1523 if (!full_scan && data != BTRFS_BLOCK_GROUP_MIXED &&
1524 last_byte >= block_group->key.objectid +
be744175
CM
1525 block_group->key.offset) {
1526 btrfs_release_path(root, path);
1527 search_start = block_group->key.objectid +
e19caa5f 1528 block_group->key.offset;
be744175
CM
1529 goto new_group;
1530 }
9078a3e1 1531next:
5caf2a00 1532 path->slots[0]++;
de428b63 1533 cond_resched();
fec577fb 1534 }
fec577fb
CM
1535check_pending:
1536 /* we have to make sure we didn't find an extent that has already
1537 * been allocated by the map tree or the original allocation
1538 */
5caf2a00 1539 btrfs_release_path(root, path);
fec577fb 1540 BUG_ON(ins->objectid < search_start);
e37c9e69 1541
db94535d 1542 if (ins->objectid + num_bytes >= search_end)
cf67582b 1543 goto enospc;
257d0ce3 1544 if (!full_scan && data != BTRFS_BLOCK_GROUP_MIXED &&
5cf66426 1545 ins->objectid + num_bytes > block_group->
e19caa5f
CM
1546 key.objectid + block_group->key.offset) {
1547 search_start = block_group->key.objectid +
1548 block_group->key.offset;
1549 goto new_group;
1550 }
1a5bc167 1551 if (test_range_bit(&info->extent_ins, ins->objectid,
db94535d
CM
1552 ins->objectid + num_bytes -1, EXTENT_LOCKED, 0)) {
1553 search_start = ins->objectid + num_bytes;
1a5bc167
CM
1554 goto new_group;
1555 }
1556 if (test_range_bit(&info->pinned_extents, ins->objectid,
db94535d
CM
1557 ins->objectid + num_bytes -1, EXTENT_DIRTY, 0)) {
1558 search_start = ins->objectid + num_bytes;
1a5bc167 1559 goto new_group;
fec577fb 1560 }
db94535d 1561 if (exclude_nr > 0 && (ins->objectid + num_bytes > exclude_start &&
f2654de4
CM
1562 ins->objectid < exclude_start + exclude_nr)) {
1563 search_start = exclude_start + exclude_nr;
1564 goto new_group;
1565 }
e37c9e69 1566 if (!data) {
5276aeda 1567 block_group = btrfs_lookup_block_group(info, ins->objectid);
26b8003f
CM
1568 if (block_group)
1569 trans->block_group = block_group;
f2458e1d 1570 }
db94535d 1571 ins->offset = num_bytes;
5caf2a00 1572 btrfs_free_path(path);
fec577fb 1573 return 0;
be744175
CM
1574
1575new_group:
db94535d 1576 if (search_start + num_bytes >= search_end) {
cf67582b 1577enospc:
be744175 1578 search_start = orig_search_start;
fbdc762b
CM
1579 if (full_scan) {
1580 ret = -ENOSPC;
1581 goto error;
1582 }
6702ed49
CM
1583 if (wrapped) {
1584 if (!full_scan)
1585 total_needed -= empty_size;
fbdc762b 1586 full_scan = 1;
1a2b2ac7 1587 data = BTRFS_BLOCK_GROUP_MIXED;
6702ed49 1588 } else
fbdc762b 1589 wrapped = 1;
be744175 1590 }
5276aeda 1591 block_group = btrfs_lookup_block_group(info, search_start);
fbdc762b 1592 cond_resched();
1a2b2ac7
CM
1593 block_group = btrfs_find_block_group(root, block_group,
1594 search_start, data, 0);
be744175
CM
1595 goto check_failed;
1596
0f70abe2 1597error:
5caf2a00
CM
1598 btrfs_release_path(root, path);
1599 btrfs_free_path(path);
0f70abe2 1600 return ret;
fec577fb 1601}
fec577fb
CM
1602/*
1603 * finds a free extent and does all the dirty work required for allocation
1604 * returns the key for the extent through ins, and a tree buffer for
1605 * the first block of the extent through buf.
1606 *
1607 * returns 0 if everything worked, non-zero otherwise.
1608 */
4d775673 1609int btrfs_alloc_extent(struct btrfs_trans_handle *trans,
7bb86316
CM
1610 struct btrfs_root *root,
1611 u64 num_bytes, u64 root_objectid, u64 ref_generation,
1612 u64 owner, u64 owner_offset,
1613 u64 empty_size, u64 hint_byte,
be08c1b9 1614 u64 search_end, struct btrfs_key *ins, int data)
fec577fb
CM
1615{
1616 int ret;
1617 int pending_ret;
db94535d 1618 u64 super_used, root_used;
fbdc762b 1619 u64 search_start = 0;
edbd8d4e 1620 u64 new_hint;
1261ec42
CM
1621 struct btrfs_fs_info *info = root->fs_info;
1622 struct btrfs_root *extent_root = info->extent_root;
234b63a0 1623 struct btrfs_extent_item extent_item;
7bb86316 1624 struct btrfs_path *path;
037e6390 1625
5f39d397 1626 btrfs_set_stack_extent_refs(&extent_item, 1);
8f662a76
CM
1627
1628 new_hint = max(hint_byte, root->fs_info->alloc_start);
edbd8d4e
CM
1629 if (new_hint < btrfs_super_total_bytes(&info->super_copy))
1630 hint_byte = new_hint;
8f662a76 1631
db94535d
CM
1632 WARN_ON(num_bytes < root->sectorsize);
1633 ret = find_free_extent(trans, root, num_bytes, empty_size,
1634 search_start, search_end, hint_byte, ins,
26b8003f
CM
1635 trans->alloc_exclude_start,
1636 trans->alloc_exclude_nr, data);
ccd467d6 1637 BUG_ON(ret);
f2654de4
CM
1638 if (ret)
1639 return ret;
fec577fb 1640
58176a96 1641 /* block accounting for super block */
db94535d
CM
1642 super_used = btrfs_super_bytes_used(&info->super_copy);
1643 btrfs_set_super_bytes_used(&info->super_copy, super_used + num_bytes);
26b8003f 1644
58176a96 1645 /* block accounting for root item */
db94535d
CM
1646 root_used = btrfs_root_used(&root->root_item);
1647 btrfs_set_root_used(&root->root_item, root_used + num_bytes);
58176a96 1648
f510cfec
CM
1649 clear_extent_dirty(&root->fs_info->free_space_cache,
1650 ins->objectid, ins->objectid + ins->offset - 1,
1651 GFP_NOFS);
1652
26b8003f 1653 if (root == extent_root) {
1a5bc167
CM
1654 set_extent_bits(&root->fs_info->extent_ins, ins->objectid,
1655 ins->objectid + ins->offset - 1,
1656 EXTENT_LOCKED, GFP_NOFS);
e19caa5f 1657 WARN_ON(data == 1);
26b8003f
CM
1658 goto update_block;
1659 }
1660
1661 WARN_ON(trans->alloc_exclude_nr);
1662 trans->alloc_exclude_start = ins->objectid;
1663 trans->alloc_exclude_nr = ins->offset;
e089f05c
CM
1664 ret = btrfs_insert_item(trans, extent_root, ins, &extent_item,
1665 sizeof(extent_item));
037e6390 1666
26b8003f
CM
1667 trans->alloc_exclude_start = 0;
1668 trans->alloc_exclude_nr = 0;
7bb86316
CM
1669 BUG_ON(ret);
1670
1671 path = btrfs_alloc_path();
1672 BUG_ON(!path);
1673 ret = btrfs_insert_extent_backref(trans, extent_root, path,
1674 ins->objectid, root_objectid,
1675 ref_generation, owner, owner_offset);
26b8003f 1676
ccd467d6 1677 BUG_ON(ret);
7bb86316 1678 btrfs_free_path(path);
e089f05c 1679 finish_current_insert(trans, extent_root);
e20d96d6 1680 pending_ret = del_pending_extents(trans, extent_root);
f510cfec 1681
e37c9e69 1682 if (ret) {
037e6390 1683 return ret;
e37c9e69
CM
1684 }
1685 if (pending_ret) {
037e6390 1686 return pending_ret;
e37c9e69 1687 }
26b8003f
CM
1688
1689update_block:
1e2677e0
CM
1690 ret = update_block_group(trans, root, ins->objectid, ins->offset, 1, 0,
1691 data);
fabb5681 1692 BUG_ON(ret);
037e6390 1693 return 0;
fec577fb
CM
1694}
1695
1696/*
1697 * helper function to allocate a block for a given tree
1698 * returns the tree buffer or NULL.
1699 */
5f39d397 1700struct extent_buffer *btrfs_alloc_free_block(struct btrfs_trans_handle *trans,
db94535d 1701 struct btrfs_root *root,
7bb86316
CM
1702 u32 blocksize,
1703 u64 root_objectid, u64 hint,
1704 u64 empty_size)
1705{
1706 u64 ref_generation;
1707
1708 if (root->ref_cows)
1709 ref_generation = trans->transid;
1710 else
1711 ref_generation = 0;
1712
1713
1714 return __btrfs_alloc_free_block(trans, root, blocksize, root_objectid,
1715 ref_generation, 0, 0, hint, empty_size);
1716}
1717
1718/*
1719 * helper function to allocate a block for a given tree
1720 * returns the tree buffer or NULL.
1721 */
1722struct extent_buffer *__btrfs_alloc_free_block(struct btrfs_trans_handle *trans,
1723 struct btrfs_root *root,
1724 u32 blocksize,
1725 u64 root_objectid,
1726 u64 ref_generation,
1727 u64 first_objectid,
1728 int level,
1729 u64 hint,
5f39d397 1730 u64 empty_size)
fec577fb 1731{
e2fa7227 1732 struct btrfs_key ins;
fec577fb 1733 int ret;
5f39d397 1734 struct extent_buffer *buf;
fec577fb 1735
7bb86316
CM
1736 ret = btrfs_alloc_extent(trans, root, blocksize,
1737 root_objectid, ref_generation,
f6dbff55 1738 level, first_objectid, empty_size, hint,
db94535d 1739 (u64)-1, &ins, 0);
fec577fb 1740 if (ret) {
54aa1f4d
CM
1741 BUG_ON(ret > 0);
1742 return ERR_PTR(ret);
fec577fb 1743 }
db94535d 1744 buf = btrfs_find_create_tree_block(root, ins.objectid, blocksize);
54aa1f4d 1745 if (!buf) {
7bb86316
CM
1746 btrfs_free_extent(trans, root, ins.objectid, blocksize,
1747 root->root_key.objectid, ref_generation,
1748 0, 0, 0);
54aa1f4d
CM
1749 return ERR_PTR(-ENOMEM);
1750 }
5f39d397
CM
1751 btrfs_set_buffer_uptodate(buf);
1752 set_extent_dirty(&trans->transaction->dirty_pages, buf->start,
1753 buf->start + buf->len - 1, GFP_NOFS);
19c00ddc
CM
1754 set_extent_bits(&BTRFS_I(root->fs_info->btree_inode)->extent_tree,
1755 buf->start, buf->start + buf->len - 1,
1756 EXTENT_CSUM, GFP_NOFS);
1757 buf->flags |= EXTENT_CSUM;
6b80053d 1758 btrfs_set_buffer_defrag(buf);
d3c2fdcf 1759 trans->blocks_used++;
fec577fb
CM
1760 return buf;
1761}
a28ec197 1762
6407bf6d 1763static int drop_leaf_ref(struct btrfs_trans_handle *trans,
5f39d397 1764 struct btrfs_root *root, struct extent_buffer *leaf)
6407bf6d 1765{
7bb86316
CM
1766 u64 leaf_owner;
1767 u64 leaf_generation;
5f39d397 1768 struct btrfs_key key;
6407bf6d
CM
1769 struct btrfs_file_extent_item *fi;
1770 int i;
1771 int nritems;
1772 int ret;
1773
5f39d397
CM
1774 BUG_ON(!btrfs_is_leaf(leaf));
1775 nritems = btrfs_header_nritems(leaf);
7bb86316
CM
1776 leaf_owner = btrfs_header_owner(leaf);
1777 leaf_generation = btrfs_header_generation(leaf);
1778
6407bf6d 1779 for (i = 0; i < nritems; i++) {
db94535d 1780 u64 disk_bytenr;
5f39d397
CM
1781
1782 btrfs_item_key_to_cpu(leaf, &key, i);
1783 if (btrfs_key_type(&key) != BTRFS_EXTENT_DATA_KEY)
6407bf6d
CM
1784 continue;
1785 fi = btrfs_item_ptr(leaf, i, struct btrfs_file_extent_item);
5f39d397
CM
1786 if (btrfs_file_extent_type(leaf, fi) ==
1787 BTRFS_FILE_EXTENT_INLINE)
236454df 1788 continue;
6407bf6d
CM
1789 /*
1790 * FIXME make sure to insert a trans record that
1791 * repeats the snapshot del on crash
1792 */
db94535d
CM
1793 disk_bytenr = btrfs_file_extent_disk_bytenr(leaf, fi);
1794 if (disk_bytenr == 0)
3a686375 1795 continue;
db94535d 1796 ret = btrfs_free_extent(trans, root, disk_bytenr,
7bb86316
CM
1797 btrfs_file_extent_disk_num_bytes(leaf, fi),
1798 leaf_owner, leaf_generation,
1799 key.objectid, key.offset, 0);
6407bf6d
CM
1800 BUG_ON(ret);
1801 }
1802 return 0;
1803}
1804
e011599b 1805static void reada_walk_down(struct btrfs_root *root,
5f39d397 1806 struct extent_buffer *node)
e011599b
CM
1807{
1808 int i;
1809 u32 nritems;
db94535d 1810 u64 bytenr;
e011599b
CM
1811 int ret;
1812 u32 refs;
db94535d
CM
1813 int level;
1814 u32 blocksize;
e011599b 1815
5f39d397 1816 nritems = btrfs_header_nritems(node);
db94535d 1817 level = btrfs_header_level(node);
e011599b 1818 for (i = 0; i < nritems; i++) {
db94535d
CM
1819 bytenr = btrfs_node_blockptr(node, i);
1820 blocksize = btrfs_level_size(root, level - 1);
1821 ret = lookup_extent_ref(NULL, root, bytenr, blocksize, &refs);
e011599b
CM
1822 BUG_ON(ret);
1823 if (refs != 1)
1824 continue;
409eb95d 1825 mutex_unlock(&root->fs_info->fs_mutex);
db94535d 1826 ret = readahead_tree_block(root, bytenr, blocksize);
409eb95d
CM
1827 cond_resched();
1828 mutex_lock(&root->fs_info->fs_mutex);
e011599b
CM
1829 if (ret)
1830 break;
1831 }
1832}
1833
9aca1d51
CM
1834/*
1835 * helper function for drop_snapshot, this walks down the tree dropping ref
1836 * counts as it goes.
1837 */
e089f05c
CM
1838static int walk_down_tree(struct btrfs_trans_handle *trans, struct btrfs_root
1839 *root, struct btrfs_path *path, int *level)
20524f02 1840{
7bb86316
CM
1841 u64 root_owner;
1842 u64 root_gen;
1843 u64 bytenr;
5f39d397
CM
1844 struct extent_buffer *next;
1845 struct extent_buffer *cur;
7bb86316 1846 struct extent_buffer *parent;
db94535d 1847 u32 blocksize;
20524f02
CM
1848 int ret;
1849 u32 refs;
1850
5caf2a00
CM
1851 WARN_ON(*level < 0);
1852 WARN_ON(*level >= BTRFS_MAX_LEVEL);
5f39d397 1853 ret = lookup_extent_ref(trans, root,
db94535d
CM
1854 path->nodes[*level]->start,
1855 path->nodes[*level]->len, &refs);
20524f02
CM
1856 BUG_ON(ret);
1857 if (refs > 1)
1858 goto out;
e011599b 1859
9aca1d51
CM
1860 /*
1861 * walk down to the last node level and free all the leaves
1862 */
6407bf6d 1863 while(*level >= 0) {
5caf2a00
CM
1864 WARN_ON(*level < 0);
1865 WARN_ON(*level >= BTRFS_MAX_LEVEL);
20524f02 1866 cur = path->nodes[*level];
e011599b
CM
1867
1868 if (*level > 0 && path->slots[*level] == 0)
5f39d397 1869 reada_walk_down(root, cur);
e011599b 1870
5f39d397 1871 if (btrfs_header_level(cur) != *level)
2c90e5d6 1872 WARN_ON(1);
e011599b 1873
7518a238 1874 if (path->slots[*level] >=
5f39d397 1875 btrfs_header_nritems(cur))
20524f02 1876 break;
6407bf6d
CM
1877 if (*level == 0) {
1878 ret = drop_leaf_ref(trans, root, cur);
1879 BUG_ON(ret);
1880 break;
1881 }
db94535d
CM
1882 bytenr = btrfs_node_blockptr(cur, path->slots[*level]);
1883 blocksize = btrfs_level_size(root, *level - 1);
1884 ret = lookup_extent_ref(trans, root, bytenr, blocksize, &refs);
6407bf6d
CM
1885 BUG_ON(ret);
1886 if (refs != 1) {
7bb86316
CM
1887 parent = path->nodes[*level];
1888 root_owner = btrfs_header_owner(parent);
1889 root_gen = btrfs_header_generation(parent);
20524f02 1890 path->slots[*level]++;
db94535d 1891 ret = btrfs_free_extent(trans, root, bytenr,
7bb86316
CM
1892 blocksize, root_owner,
1893 root_gen, 0, 0, 1);
20524f02
CM
1894 BUG_ON(ret);
1895 continue;
1896 }
db94535d 1897 next = btrfs_find_tree_block(root, bytenr, blocksize);
5f39d397
CM
1898 if (!next || !btrfs_buffer_uptodate(next)) {
1899 free_extent_buffer(next);
e9d0b13b 1900 mutex_unlock(&root->fs_info->fs_mutex);
db94535d 1901 next = read_tree_block(root, bytenr, blocksize);
e9d0b13b
CM
1902 mutex_lock(&root->fs_info->fs_mutex);
1903
1904 /* we dropped the lock, check one more time */
db94535d
CM
1905 ret = lookup_extent_ref(trans, root, bytenr,
1906 blocksize, &refs);
e9d0b13b
CM
1907 BUG_ON(ret);
1908 if (refs != 1) {
7bb86316
CM
1909 parent = path->nodes[*level];
1910 root_owner = btrfs_header_owner(parent);
1911 root_gen = btrfs_header_generation(parent);
1912
e9d0b13b 1913 path->slots[*level]++;
5f39d397 1914 free_extent_buffer(next);
7bb86316
CM
1915 ret = btrfs_free_extent(trans, root, bytenr,
1916 blocksize,
1917 root_owner,
1918 root_gen, 0, 0, 1);
e9d0b13b
CM
1919 BUG_ON(ret);
1920 continue;
1921 }
1922 }
5caf2a00 1923 WARN_ON(*level <= 0);
83e15a28 1924 if (path->nodes[*level-1])
5f39d397 1925 free_extent_buffer(path->nodes[*level-1]);
20524f02 1926 path->nodes[*level-1] = next;
5f39d397 1927 *level = btrfs_header_level(next);
20524f02
CM
1928 path->slots[*level] = 0;
1929 }
1930out:
5caf2a00
CM
1931 WARN_ON(*level < 0);
1932 WARN_ON(*level >= BTRFS_MAX_LEVEL);
7bb86316
CM
1933
1934 if (path->nodes[*level] == root->node) {
1935 root_owner = root->root_key.objectid;
1936 parent = path->nodes[*level];
1937 } else {
1938 parent = path->nodes[*level + 1];
1939 root_owner = btrfs_header_owner(parent);
1940 }
1941
1942 root_gen = btrfs_header_generation(parent);
db94535d 1943 ret = btrfs_free_extent(trans, root, path->nodes[*level]->start,
7bb86316
CM
1944 path->nodes[*level]->len,
1945 root_owner, root_gen, 0, 0, 1);
5f39d397 1946 free_extent_buffer(path->nodes[*level]);
20524f02
CM
1947 path->nodes[*level] = NULL;
1948 *level += 1;
1949 BUG_ON(ret);
1950 return 0;
1951}
1952
9aca1d51
CM
1953/*
1954 * helper for dropping snapshots. This walks back up the tree in the path
1955 * to find the first node higher up where we haven't yet gone through
1956 * all the slots
1957 */
e089f05c
CM
1958static int walk_up_tree(struct btrfs_trans_handle *trans, struct btrfs_root
1959 *root, struct btrfs_path *path, int *level)
20524f02 1960{
7bb86316
CM
1961 u64 root_owner;
1962 u64 root_gen;
1963 struct btrfs_root_item *root_item = &root->root_item;
20524f02
CM
1964 int i;
1965 int slot;
1966 int ret;
9f3a7427 1967
234b63a0 1968 for(i = *level; i < BTRFS_MAX_LEVEL - 1 && path->nodes[i]; i++) {
20524f02 1969 slot = path->slots[i];
5f39d397
CM
1970 if (slot < btrfs_header_nritems(path->nodes[i]) - 1) {
1971 struct extent_buffer *node;
1972 struct btrfs_disk_key disk_key;
1973 node = path->nodes[i];
20524f02
CM
1974 path->slots[i]++;
1975 *level = i;
9f3a7427 1976 WARN_ON(*level == 0);
5f39d397 1977 btrfs_node_key(node, &disk_key, path->slots[i]);
9f3a7427 1978 memcpy(&root_item->drop_progress,
5f39d397 1979 &disk_key, sizeof(disk_key));
9f3a7427 1980 root_item->drop_level = i;
20524f02
CM
1981 return 0;
1982 } else {
7bb86316
CM
1983 if (path->nodes[*level] == root->node) {
1984 root_owner = root->root_key.objectid;
1985 root_gen =
1986 btrfs_header_generation(path->nodes[*level]);
1987 } else {
1988 struct extent_buffer *node;
1989 node = path->nodes[*level + 1];
1990 root_owner = btrfs_header_owner(node);
1991 root_gen = btrfs_header_generation(node);
1992 }
e089f05c 1993 ret = btrfs_free_extent(trans, root,
db94535d 1994 path->nodes[*level]->start,
7bb86316
CM
1995 path->nodes[*level]->len,
1996 root_owner, root_gen, 0, 0, 1);
6407bf6d 1997 BUG_ON(ret);
5f39d397 1998 free_extent_buffer(path->nodes[*level]);
83e15a28 1999 path->nodes[*level] = NULL;
20524f02 2000 *level = i + 1;
20524f02
CM
2001 }
2002 }
2003 return 1;
2004}
2005
9aca1d51
CM
2006/*
2007 * drop the reference count on the tree rooted at 'snap'. This traverses
2008 * the tree freeing any blocks that have a ref count of zero after being
2009 * decremented.
2010 */
e089f05c 2011int btrfs_drop_snapshot(struct btrfs_trans_handle *trans, struct btrfs_root
9f3a7427 2012 *root)
20524f02 2013{
3768f368 2014 int ret = 0;
9aca1d51 2015 int wret;
20524f02 2016 int level;
5caf2a00 2017 struct btrfs_path *path;
20524f02
CM
2018 int i;
2019 int orig_level;
9f3a7427 2020 struct btrfs_root_item *root_item = &root->root_item;
20524f02 2021
5caf2a00
CM
2022 path = btrfs_alloc_path();
2023 BUG_ON(!path);
20524f02 2024
5f39d397 2025 level = btrfs_header_level(root->node);
20524f02 2026 orig_level = level;
9f3a7427
CM
2027 if (btrfs_disk_key_objectid(&root_item->drop_progress) == 0) {
2028 path->nodes[level] = root->node;
f510cfec 2029 extent_buffer_get(root->node);
9f3a7427
CM
2030 path->slots[level] = 0;
2031 } else {
2032 struct btrfs_key key;
5f39d397
CM
2033 struct btrfs_disk_key found_key;
2034 struct extent_buffer *node;
6702ed49 2035
9f3a7427 2036 btrfs_disk_key_to_cpu(&key, &root_item->drop_progress);
6702ed49
CM
2037 level = root_item->drop_level;
2038 path->lowest_level = level;
9f3a7427 2039 wret = btrfs_search_slot(NULL, root, &key, path, 0, 0);
6702ed49 2040 if (wret < 0) {
9f3a7427
CM
2041 ret = wret;
2042 goto out;
2043 }
5f39d397
CM
2044 node = path->nodes[level];
2045 btrfs_node_key(node, &found_key, path->slots[level]);
2046 WARN_ON(memcmp(&found_key, &root_item->drop_progress,
2047 sizeof(found_key)));
9f3a7427 2048 }
20524f02 2049 while(1) {
5caf2a00 2050 wret = walk_down_tree(trans, root, path, &level);
9aca1d51 2051 if (wret > 0)
20524f02 2052 break;
9aca1d51
CM
2053 if (wret < 0)
2054 ret = wret;
2055
5caf2a00 2056 wret = walk_up_tree(trans, root, path, &level);
9aca1d51 2057 if (wret > 0)
20524f02 2058 break;
9aca1d51
CM
2059 if (wret < 0)
2060 ret = wret;
409eb95d 2061 ret = -EAGAIN;
409eb95d 2062 break;
20524f02 2063 }
83e15a28 2064 for (i = 0; i <= orig_level; i++) {
5caf2a00 2065 if (path->nodes[i]) {
5f39d397 2066 free_extent_buffer(path->nodes[i]);
0f82731f 2067 path->nodes[i] = NULL;
83e15a28 2068 }
20524f02 2069 }
9f3a7427 2070out:
5caf2a00 2071 btrfs_free_path(path);
9aca1d51 2072 return ret;
20524f02 2073}
9078a3e1 2074
96b5179d 2075int btrfs_free_block_groups(struct btrfs_fs_info *info)
9078a3e1 2076{
96b5179d
CM
2077 u64 start;
2078 u64 end;
b97f9203 2079 u64 ptr;
9078a3e1 2080 int ret;
9078a3e1 2081 while(1) {
96b5179d
CM
2082 ret = find_first_extent_bit(&info->block_group_cache, 0,
2083 &start, &end, (unsigned int)-1);
2084 if (ret)
9078a3e1 2085 break;
b97f9203
Y
2086 ret = get_state_private(&info->block_group_cache, start, &ptr);
2087 if (!ret)
2088 kfree((void *)(unsigned long)ptr);
96b5179d
CM
2089 clear_extent_bits(&info->block_group_cache, start,
2090 end, (unsigned int)-1, GFP_NOFS);
9078a3e1 2091 }
e37c9e69 2092 while(1) {
f510cfec
CM
2093 ret = find_first_extent_bit(&info->free_space_cache, 0,
2094 &start, &end, EXTENT_DIRTY);
2095 if (ret)
e37c9e69 2096 break;
f510cfec
CM
2097 clear_extent_dirty(&info->free_space_cache, start,
2098 end, GFP_NOFS);
e37c9e69 2099 }
be744175
CM
2100 return 0;
2101}
2102
edbd8d4e
CM
2103static int relocate_inode_pages(struct inode *inode, u64 start, u64 len)
2104{
2105 u64 page_start;
2106 u64 page_end;
2107 u64 delalloc_start;
2108 u64 existing_delalloc;
2109 unsigned long last_index;
edbd8d4e
CM
2110 unsigned long i;
2111 struct page *page;
2112 struct btrfs_root *root = BTRFS_I(inode)->root;
2113 struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
4313b399
CM
2114 struct file_ra_state *ra;
2115
2116 ra = kzalloc(sizeof(*ra), GFP_NOFS);
edbd8d4e
CM
2117
2118 mutex_lock(&inode->i_mutex);
4313b399 2119 i = start >> PAGE_CACHE_SHIFT;
edbd8d4e
CM
2120 last_index = (start + len - 1) >> PAGE_CACHE_SHIFT;
2121
4313b399
CM
2122 file_ra_state_init(ra, inode->i_mapping);
2123 btrfs_force_ra(inode->i_mapping, ra, NULL, i, last_index);
2124 kfree(ra);
edbd8d4e 2125
4313b399 2126 for (; i <= last_index; i++) {
edbd8d4e
CM
2127 page = grab_cache_page(inode->i_mapping, i);
2128 if (!page)
2129 goto out_unlock;
2130 if (!PageUptodate(page)) {
2131 btrfs_readpage(NULL, page);
2132 lock_page(page);
2133 if (!PageUptodate(page)) {
2134 unlock_page(page);
2135 page_cache_release(page);
2136 goto out_unlock;
2137 }
2138 }
2139 page_start = (u64)page->index << PAGE_CACHE_SHIFT;
2140 page_end = page_start + PAGE_CACHE_SIZE - 1;
2141
2142 lock_extent(em_tree, page_start, page_end, GFP_NOFS);
2143
2144 delalloc_start = page_start;
2145 existing_delalloc =
2146 count_range_bits(&BTRFS_I(inode)->extent_tree,
2147 &delalloc_start, page_end,
2148 PAGE_CACHE_SIZE, EXTENT_DELALLOC);
2149
2150 set_extent_delalloc(em_tree, page_start,
2151 page_end, GFP_NOFS);
2152
2153 spin_lock(&root->fs_info->delalloc_lock);
2154 root->fs_info->delalloc_bytes += PAGE_CACHE_SIZE -
2155 existing_delalloc;
2156 spin_unlock(&root->fs_info->delalloc_lock);
2157
2158 unlock_extent(em_tree, page_start, page_end, GFP_NOFS);
2159 set_page_dirty(page);
2160 unlock_page(page);
2161 page_cache_release(page);
2162 }
2163
2164out_unlock:
2165 mutex_unlock(&inode->i_mutex);
2166 return 0;
2167}
2168
4313b399
CM
2169/*
2170 * note, this releases the path
2171 */
edbd8d4e
CM
2172static int relocate_one_reference(struct btrfs_root *extent_root,
2173 struct btrfs_path *path,
4313b399 2174 struct btrfs_key *extent_key)
edbd8d4e
CM
2175{
2176 struct inode *inode;
2177 struct btrfs_root *found_root;
4313b399
CM
2178 struct btrfs_key *root_location;
2179 struct btrfs_extent_ref *ref;
2180 u64 ref_root;
2181 u64 ref_gen;
2182 u64 ref_objectid;
2183 u64 ref_offset;
edbd8d4e
CM
2184 int ret;
2185
4313b399
CM
2186 ref = btrfs_item_ptr(path->nodes[0], path->slots[0],
2187 struct btrfs_extent_ref);
2188 ref_root = btrfs_ref_root(path->nodes[0], ref);
2189 ref_gen = btrfs_ref_generation(path->nodes[0], ref);
2190 ref_objectid = btrfs_ref_objectid(path->nodes[0], ref);
2191 ref_offset = btrfs_ref_offset(path->nodes[0], ref);
2192 btrfs_release_path(extent_root, path);
2193
2194 root_location = kmalloc(sizeof(*root_location), GFP_NOFS);
2195 root_location->objectid = ref_root;
edbd8d4e 2196 if (ref_gen == 0)
4313b399 2197 root_location->offset = 0;
edbd8d4e 2198 else
4313b399
CM
2199 root_location->offset = (u64)-1;
2200 root_location->type = BTRFS_ROOT_ITEM_KEY;
edbd8d4e
CM
2201
2202 found_root = btrfs_read_fs_root_no_name(extent_root->fs_info,
4313b399 2203 root_location);
edbd8d4e 2204 BUG_ON(!found_root);
4313b399 2205 kfree(root_location);
edbd8d4e
CM
2206
2207 if (ref_objectid >= BTRFS_FIRST_FREE_OBJECTID) {
2208 mutex_unlock(&extent_root->fs_info->fs_mutex);
2209 inode = btrfs_iget_locked(extent_root->fs_info->sb,
2210 ref_objectid, found_root);
2211 if (inode->i_state & I_NEW) {
2212 /* the inode and parent dir are two different roots */
2213 BTRFS_I(inode)->root = found_root;
2214 BTRFS_I(inode)->location.objectid = ref_objectid;
2215 BTRFS_I(inode)->location.type = BTRFS_INODE_ITEM_KEY;
2216 BTRFS_I(inode)->location.offset = 0;
2217 btrfs_read_locked_inode(inode);
2218 unlock_new_inode(inode);
2219
2220 }
2221 /* this can happen if the reference is not against
2222 * the latest version of the tree root
2223 */
2224 if (is_bad_inode(inode)) {
2225 mutex_lock(&extent_root->fs_info->fs_mutex);
2226 goto out;
2227 }
2228 relocate_inode_pages(inode, ref_offset, extent_key->offset);
2229 /* FIXME, data=ordered will help get rid of this */
2230 filemap_fdatawrite(inode->i_mapping);
2231 iput(inode);
2232 mutex_lock(&extent_root->fs_info->fs_mutex);
2233 } else {
2234 struct btrfs_trans_handle *trans;
2235 struct btrfs_key found_key;
2236 struct extent_buffer *eb;
2237 int level;
2238 int i;
2239
2240 trans = btrfs_start_transaction(found_root, 1);
2241 eb = read_tree_block(found_root, extent_key->objectid,
2242 extent_key->offset);
2243 level = btrfs_header_level(eb);
2244
2245 if (level == 0)
2246 btrfs_item_key_to_cpu(eb, &found_key, 0);
2247 else
2248 btrfs_node_key_to_cpu(eb, &found_key, 0);
2249
2250 free_extent_buffer(eb);
2251
2252 path->lowest_level = level;
8f662a76 2253 path->reada = 2;
edbd8d4e
CM
2254 ret = btrfs_search_slot(trans, found_root, &found_key, path,
2255 0, 1);
2256 path->lowest_level = 0;
2257 for (i = level; i < BTRFS_MAX_LEVEL; i++) {
2258 if (!path->nodes[i])
2259 break;
2260 free_extent_buffer(path->nodes[i]);
2261 path->nodes[i] = NULL;
2262 }
2263 btrfs_release_path(found_root, path);
2264 btrfs_end_transaction(trans, found_root);
2265 }
2266
2267out:
2268 return 0;
2269}
2270
2271static int relocate_one_extent(struct btrfs_root *extent_root,
2272 struct btrfs_path *path,
2273 struct btrfs_key *extent_key)
2274{
2275 struct btrfs_key key;
2276 struct btrfs_key found_key;
edbd8d4e 2277 struct extent_buffer *leaf;
edbd8d4e
CM
2278 u32 nritems;
2279 u32 item_size;
2280 int ret = 0;
2281
2282 key.objectid = extent_key->objectid;
2283 key.type = BTRFS_EXTENT_REF_KEY;
2284 key.offset = 0;
2285
2286 while(1) {
2287 ret = btrfs_search_slot(NULL, extent_root, &key, path, 0, 0);
2288
2289 BUG_ON(ret == 0);
2290
2291 if (ret < 0)
2292 goto out;
2293
2294 ret = 0;
2295 leaf = path->nodes[0];
2296 nritems = btrfs_header_nritems(leaf);
2297 if (path->slots[0] == nritems)
2298 goto out;
2299
2300 btrfs_item_key_to_cpu(leaf, &found_key, path->slots[0]);
2301 if (found_key.objectid != extent_key->objectid)
2302 break;
2303
2304 if (found_key.type != BTRFS_EXTENT_REF_KEY)
2305 break;
2306
2307 key.offset = found_key.offset + 1;
2308 item_size = btrfs_item_size_nr(leaf, path->slots[0]);
2309
4313b399 2310 ret = relocate_one_reference(extent_root, path, extent_key);
edbd8d4e
CM
2311 if (ret)
2312 goto out;
2313 }
2314 ret = 0;
2315out:
2316 btrfs_release_path(extent_root, path);
2317 return ret;
2318}
2319
2320static int find_overlapping_extent(struct btrfs_root *root,
2321 struct btrfs_path *path, u64 new_size)
2322{
2323 struct btrfs_key found_key;
2324 struct extent_buffer *leaf;
2325 int ret;
2326
2327 while(1) {
2328 if (path->slots[0] == 0) {
2329 ret = btrfs_prev_leaf(root, path);
2330 if (ret == 1) {
2331 return 1;
2332 }
2333 if (ret < 0)
2334 return ret;
2335 } else {
2336 path->slots[0]--;
2337 }
2338 leaf = path->nodes[0];
2339 btrfs_item_key_to_cpu(leaf, &found_key, path->slots[0]);
2340 if (found_key.type == BTRFS_EXTENT_ITEM_KEY) {
2341 if (found_key.objectid + found_key.offset > new_size)
2342 return 0;
2343 else
2344 return 1;
2345 }
2346 }
2347 return 1;
2348}
2349
2350int btrfs_shrink_extent_tree(struct btrfs_root *root, u64 new_size)
2351{
2352 struct btrfs_trans_handle *trans;
2353 struct btrfs_root *tree_root = root->fs_info->tree_root;
2354 struct btrfs_path *path;
2355 u64 cur_byte;
2356 u64 total_found;
edbd8d4e
CM
2357 struct btrfs_fs_info *info = root->fs_info;
2358 struct extent_map_tree *block_group_cache;
2359 struct btrfs_key key;
2360 struct btrfs_key found_key = { 0, 0, 0 };
2361 struct extent_buffer *leaf;
2362 u32 nritems;
2363 int ret;
2364 int slot;
2365
2366 btrfs_set_super_total_bytes(&info->super_copy, new_size);
2367 block_group_cache = &info->block_group_cache;
2368 path = btrfs_alloc_path();
2369 root = root->fs_info->extent_root;
8f662a76 2370 path->reada = 2;
edbd8d4e
CM
2371
2372again:
2373 total_found = 0;
2374 key.objectid = new_size;
2375 cur_byte = key.objectid;
2376 key.offset = 0;
2377 key.type = 0;
2378 while(1) {
4313b399 2379
edbd8d4e
CM
2380 ret = btrfs_search_slot(NULL, root, &key, path, 0, 0);
2381 if (ret < 0)
2382 goto out;
2383next:
2384 leaf = path->nodes[0];
2385 if (key.objectid == new_size - 1) {
2386 ret = find_overlapping_extent(root, path, new_size);
2387 if (ret != 0) {
2388 btrfs_release_path(root, path);
2389 ret = btrfs_search_slot(NULL, root, &key,
2390 path, 0, 0);
2391 if (ret < 0)
2392 goto out;
2393 }
2394 }
2395 nritems = btrfs_header_nritems(leaf);
2396 ret = 0;
2397 slot = path->slots[0];
2398 if (slot < nritems)
2399 btrfs_item_key_to_cpu(leaf, &found_key, slot);
2400 if (slot == nritems ||
2401 btrfs_key_type(&found_key) != BTRFS_EXTENT_ITEM_KEY) {
2402 path->slots[0]++;
2403 if (path->slots[0] >= nritems) {
2404 ret = btrfs_next_leaf(root, path);
2405 if (ret < 0)
2406 goto out;
2407 if (ret == 1) {
2408 ret = 0;
2409 break;
2410 }
2411 }
2412 goto next;
2413 }
2414 btrfs_item_key_to_cpu(leaf, &found_key, slot);
2415 if (found_key.objectid + found_key.offset <= cur_byte)
2416 continue;
2417 total_found++;
2418 cur_byte = found_key.objectid + found_key.offset;
2419 key.objectid = cur_byte;
2420 btrfs_release_path(root, path);
2421 ret = relocate_one_extent(root, path, &found_key);
2422 }
2423
2424 btrfs_release_path(root, path);
2425
2426 if (total_found > 0) {
2427 trans = btrfs_start_transaction(tree_root, 1);
2428 btrfs_commit_transaction(trans, tree_root);
2429
2430 mutex_unlock(&root->fs_info->fs_mutex);
2431 btrfs_clean_old_snapshots(tree_root);
2432 mutex_lock(&root->fs_info->fs_mutex);
2433
2434 trans = btrfs_start_transaction(tree_root, 1);
2435 btrfs_commit_transaction(trans, tree_root);
2436 goto again;
2437 }
2438
2439 trans = btrfs_start_transaction(root, 1);
2440 key.objectid = new_size;
2441 key.offset = 0;
2442 key.type = 0;
2443 while(1) {
4313b399
CM
2444 u64 ptr;
2445
edbd8d4e
CM
2446 ret = btrfs_search_slot(trans, root, &key, path, -1, 1);
2447 if (ret < 0)
2448 goto out;
2449bg_next:
2450 leaf = path->nodes[0];
2451 nritems = btrfs_header_nritems(leaf);
2452 ret = 0;
2453 slot = path->slots[0];
2454 if (slot < nritems)
2455 btrfs_item_key_to_cpu(leaf, &found_key, slot);
2456 if (slot == nritems ||
2457 btrfs_key_type(&found_key) != BTRFS_BLOCK_GROUP_ITEM_KEY) {
2458 if (slot < nritems) {
2459 printk("shrinker found key %Lu %u %Lu\n",
2460 found_key.objectid, found_key.type,
2461 found_key.offset);
2462 path->slots[0]++;
2463 }
2464 if (path->slots[0] >= nritems) {
2465 ret = btrfs_next_leaf(root, path);
2466 if (ret < 0)
2467 break;
2468 if (ret == 1) {
2469 ret = 0;
2470 break;
2471 }
2472 }
2473 goto bg_next;
2474 }
2475 btrfs_item_key_to_cpu(leaf, &found_key, slot);
2476 ret = get_state_private(&info->block_group_cache,
2477 found_key.objectid, &ptr);
2478 if (!ret)
2479 kfree((void *)(unsigned long)ptr);
2480
2481 clear_extent_bits(&info->block_group_cache, found_key.objectid,
2482 found_key.objectid + found_key.offset - 1,
2483 (unsigned int)-1, GFP_NOFS);
2484
2485 key.objectid = found_key.objectid + 1;
2486 btrfs_del_item(trans, root, path);
2487 btrfs_release_path(root, path);
2488 }
2489 clear_extent_dirty(&info->free_space_cache, new_size, (u64)-1,
2490 GFP_NOFS);
2491 btrfs_commit_transaction(trans, root);
2492out:
2493 btrfs_free_path(path);
2494 return ret;
2495}
2496
2497int btrfs_grow_extent_tree(struct btrfs_trans_handle *trans,
2498 struct btrfs_root *root, u64 new_size)
2499{
2500 struct btrfs_path *path;
2501 u64 nr = 0;
2502 u64 cur_byte;
2503 u64 old_size;
f9ef6604 2504 unsigned long rem;
edbd8d4e
CM
2505 struct btrfs_block_group_cache *cache;
2506 struct btrfs_block_group_item *item;
2507 struct btrfs_fs_info *info = root->fs_info;
2508 struct extent_map_tree *block_group_cache;
2509 struct btrfs_key key;
2510 struct extent_buffer *leaf;
2511 int ret;
2512 int bit;
2513
2514 old_size = btrfs_super_total_bytes(&info->super_copy);
2515 block_group_cache = &info->block_group_cache;
2516
2517 root = info->extent_root;
2518
2519 cache = btrfs_lookup_block_group(root->fs_info, old_size - 1);
2520
2521 cur_byte = cache->key.objectid + cache->key.offset;
2522 if (cur_byte >= new_size)
2523 goto set_size;
2524
2525 key.offset = BTRFS_BLOCK_GROUP_SIZE;
2526 btrfs_set_key_type(&key, BTRFS_BLOCK_GROUP_ITEM_KEY);
2527
2528 path = btrfs_alloc_path();
2529 if (!path)
2530 return -ENOMEM;
2531
2532 while(cur_byte < new_size) {
2533 key.objectid = cur_byte;
2534 ret = btrfs_insert_empty_item(trans, root, path, &key,
2535 sizeof(struct btrfs_block_group_item));
2536 BUG_ON(ret);
2537 leaf = path->nodes[0];
2538 item = btrfs_item_ptr(leaf, path->slots[0],
2539 struct btrfs_block_group_item);
2540
2541 btrfs_set_disk_block_group_used(leaf, item, 0);
f9ef6604
CM
2542 div_long_long_rem(nr, 3, &rem);
2543 if (rem) {
edbd8d4e
CM
2544 btrfs_set_disk_block_group_flags(leaf, item,
2545 BTRFS_BLOCK_GROUP_DATA);
2546 } else {
2547 btrfs_set_disk_block_group_flags(leaf, item, 0);
2548 }
2549 nr++;
2550
2551 cache = kmalloc(sizeof(*cache), GFP_NOFS);
2552 BUG_ON(!cache);
2553
2554 read_extent_buffer(leaf, &cache->item, (unsigned long)item,
2555 sizeof(cache->item));
2556
2557 memcpy(&cache->key, &key, sizeof(key));
2558 cache->cached = 0;
2559 cache->pinned = 0;
2560 cur_byte = key.objectid + key.offset;
2561 btrfs_release_path(root, path);
2562
2563 if (cache->item.flags & BTRFS_BLOCK_GROUP_DATA) {
2564 bit = BLOCK_GROUP_DATA;
2565 cache->data = BTRFS_BLOCK_GROUP_DATA;
2566 } else {
2567 bit = BLOCK_GROUP_METADATA;
2568 cache->data = 0;
2569 }
2570
2571 /* use EXTENT_LOCKED to prevent merging */
2572 set_extent_bits(block_group_cache, key.objectid,
2573 key.objectid + key.offset - 1,
2574 bit | EXTENT_LOCKED, GFP_NOFS);
2575 set_state_private(block_group_cache, key.objectid,
2576 (unsigned long)cache);
2577 }
2578 btrfs_free_path(path);
2579set_size:
2580 btrfs_set_super_total_bytes(&info->super_copy, new_size);
2581 return 0;
2582}
2583
9078a3e1
CM
2584int btrfs_read_block_groups(struct btrfs_root *root)
2585{
2586 struct btrfs_path *path;
2587 int ret;
2588 int err = 0;
96b5179d 2589 int bit;
9078a3e1 2590 struct btrfs_block_group_cache *cache;
be744175 2591 struct btrfs_fs_info *info = root->fs_info;
96b5179d 2592 struct extent_map_tree *block_group_cache;
9078a3e1
CM
2593 struct btrfs_key key;
2594 struct btrfs_key found_key;
5f39d397 2595 struct extent_buffer *leaf;
96b5179d
CM
2596
2597 block_group_cache = &info->block_group_cache;
9078a3e1 2598
be744175 2599 root = info->extent_root;
9078a3e1 2600 key.objectid = 0;
db94535d 2601 key.offset = BTRFS_BLOCK_GROUP_SIZE;
9078a3e1
CM
2602 btrfs_set_key_type(&key, BTRFS_BLOCK_GROUP_ITEM_KEY);
2603
2604 path = btrfs_alloc_path();
2605 if (!path)
2606 return -ENOMEM;
2607
2608 while(1) {
be744175 2609 ret = btrfs_search_slot(NULL, info->extent_root,
9078a3e1
CM
2610 &key, path, 0, 0);
2611 if (ret != 0) {
2612 err = ret;
2613 break;
2614 }
5f39d397
CM
2615 leaf = path->nodes[0];
2616 btrfs_item_key_to_cpu(leaf, &found_key, path->slots[0]);
9078a3e1
CM
2617 cache = kmalloc(sizeof(*cache), GFP_NOFS);
2618 if (!cache) {
2619 err = -1;
2620 break;
2621 }
3e1ad54f 2622
5f39d397
CM
2623 read_extent_buffer(leaf, &cache->item,
2624 btrfs_item_ptr_offset(leaf, path->slots[0]),
2625 sizeof(cache->item));
9078a3e1 2626 memcpy(&cache->key, &found_key, sizeof(found_key));
e37c9e69 2627 cache->cached = 0;
324ae4df 2628 cache->pinned = 0;
9078a3e1
CM
2629 key.objectid = found_key.objectid + found_key.offset;
2630 btrfs_release_path(root, path);
5f39d397 2631
f84a8b36
CM
2632 if (cache->item.flags & BTRFS_BLOCK_GROUP_MIXED) {
2633 bit = BLOCK_GROUP_DATA | BLOCK_GROUP_METADATA;
2634 cache->data = BTRFS_BLOCK_GROUP_MIXED;
2635 } else if (cache->item.flags & BTRFS_BLOCK_GROUP_DATA) {
96b5179d 2636 bit = BLOCK_GROUP_DATA;
f84a8b36 2637 cache->data = BTRFS_BLOCK_GROUP_DATA;
96b5179d
CM
2638 } else {
2639 bit = BLOCK_GROUP_METADATA;
2640 cache->data = 0;
31f3c99b 2641 }
96b5179d
CM
2642
2643 /* use EXTENT_LOCKED to prevent merging */
2644 set_extent_bits(block_group_cache, found_key.objectid,
2645 found_key.objectid + found_key.offset - 1,
2646 bit | EXTENT_LOCKED, GFP_NOFS);
2647 set_state_private(block_group_cache, found_key.objectid,
ae2f5411 2648 (unsigned long)cache);
96b5179d 2649
9078a3e1 2650 if (key.objectid >=
db94535d 2651 btrfs_super_total_bytes(&info->super_copy))
9078a3e1
CM
2652 break;
2653 }
2654
2655 btrfs_free_path(path);
2656 return 0;
2657}