2 * Copyright (C) 2007 Oracle. All rights reserved.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public
6 * License v2 as published by the Free Software Foundation.
8 * This program is distributed in the hope that it will be useful,
9 * but WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
13 * You should have received a copy of the GNU General Public
14 * License along with this program; if not, write to the
15 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
16 * Boston, MA 02111-1307, USA.
19 #define _XOPEN_SOURCE 600
24 #include <sys/types.h>
28 #include "kerncompat.h"
29 #include "radix-tree.h"
33 #include "transaction.h"
36 #include "print-tree.h"
/*
 * Check a tree block against what the caller expects: the buffer's start
 * offset is compared with the bytenr stored in the block header, and the
 * fsid bytes in the header are compared with root->fs_info->fsid.
 * The return statements and the length passed to the fsid comparison are
 * not visible in this excerpt.
 */
38 static int check_tree_block(struct btrfs_root *root, struct extent_buffer *buf)
40 if (buf->start != btrfs_header_bytenr(buf))
43 if (memcmp_extent_buffer(buf, root->fs_info->fsid,
44 (unsigned long)btrfs_header_fsid(buf),
/*
 * Return crc32c() over len bytes of data, starting from seed.
 * The root argument is not referenced by the visible body.
 */
50 u32 btrfs_csum_data(struct btrfs_root *root, char *data, u32 seed, size_t len)
52 return crc32c(seed, data, len);
/*
 * Finalize a running crc: store the bitwise complement of cpu_to_le32(crc)
 * into result, which is written through as a __le32.
 */
55 void btrfs_csum_final(u32 crc, char *result)
57 *(__le32 *)result = ~cpu_to_le32(crc);
/*
 * Checksum a tree block.  The crc32c is taken over everything after the
 * first BTRFS_CSUM_SIZE bytes of buf->data and finalized with
 * btrfs_csum_final().  The result is then either compared with the bytes at
 * offset 0 of the extent buffer (printing a message on mismatch) or written
 * there.  The remaining parameter(s) and the branch that selects between
 * verifying and writing are not visible in this excerpt.
 */
60 int csum_tree_block(struct btrfs_root *root, struct extent_buffer *buf,
63 char result[BTRFS_CRC32_SIZE];
67 len = buf->len - BTRFS_CSUM_SIZE;
68 crc = crc32c(crc, buf->data + BTRFS_CSUM_SIZE, len);
69 btrfs_csum_final(crc, result);
72 if (memcmp_extent_buffer(buf, result, 0, BTRFS_CRC32_SIZE)) {
/*
 * Print the checksum bytes held in the block data rather than the leading
 * bytes of the struct extent_buffer itself.  Presumably offset 0 of the
 * extent buffer corresponds to buf->data[0], as the compare above and the
 * crc range suggest; confirm against the extent_io helpers.
 */
73 printk("checksum verify failed on %llu wanted %X "
74 "found %X\n", (unsigned long long)buf->start,
75 *((int *)result), *((int *)buf->data));
79 write_extent_buffer(buf, result, 0, BTRFS_CRC32_SIZE);
/*
 * Look up an extent buffer in root->fs_info->extent_cache via
 * find_extent_buffer().  The remaining arguments of that call are not
 * visible in this excerpt.
 */
84 struct extent_buffer *btrfs_find_tree_block(struct btrfs_root *root,
85 u64 bytenr, u32 blocksize)
87 return find_extent_buffer(&root->fs_info->extent_cache,
/*
 * Obtain an extent buffer for bytenr from root->fs_info->extent_cache via
 * alloc_extent_buffer().  The trailing argument(s) of that call are not
 * visible in this excerpt.
 */
91 struct extent_buffer *btrfs_find_create_tree_block(struct btrfs_root *root,
92 u64 bytenr, u32 blocksize)
94 return alloc_extent_buffer(&root->fs_info->extent_cache, bytenr,
/*
 * Issue a readahead() for a tree block.  The block is first looked up in
 * the cache; an already up-to-date buffer is released without issuing a
 * read.  Otherwise the logical bytenr is mapped with btrfs_map_block() and
 * readahead() is called on the first stripe's device fd and physical offset.
 * Return values and error handling are not visible in this excerpt.
 */
98 int readahead_tree_block(struct btrfs_root *root, u64 bytenr, u32 blocksize)
102 struct extent_buffer *eb;
104 struct btrfs_multi_bio *multi = NULL;
105 struct btrfs_device *device;
107 eb = btrfs_find_tree_block(root, bytenr, blocksize);
108 if (eb && btrfs_buffer_uptodate(eb)) {
109 free_extent_buffer(eb);
115 ret = btrfs_map_block(&root->fs_info->mapping_tree, READ,
116 bytenr, &length, &multi, 0);
/* Only the first stripe returned by the mapping is used. */
118 device = multi->stripes[0].dev;
/* Cap the readahead request at 64 KiB. */
120 blocksize = min(blocksize, (u32)(64 * 1024));
121 readahead(device->fd, multi->stripes[0].physical, blocksize);
/*
 * Read a tree block.  A buffer is obtained with
 * btrfs_find_create_tree_block(); if it is not already up to date, the
 * logical address is mapped for the current mirror_num, the buffer is read
 * from the first stripe, and it is accepted only when the read succeeds and
 * both check_tree_block() and csum_tree_block(..., 1) return 0.  On failure
 * the number of copies is queried, a message is printed when there is only
 * one copy or when mirror_num exceeds the copy count, and the buffer is
 * released.  The retry loop, the mirror_num update and the return statements
 * are not visible in this excerpt.
 */
126 struct extent_buffer *read_tree_block(struct btrfs_root *root, u64 bytenr,
131 struct extent_buffer *eb;
133 struct btrfs_multi_bio *multi = NULL;
134 struct btrfs_device *device;
138 eb = btrfs_find_create_tree_block(root, bytenr, blocksize);
142 if (btrfs_buffer_uptodate(eb))
148 ret = btrfs_map_block(&root->fs_info->mapping_tree, READ,
149 eb->start, &length, &multi, mirror_num);
151 device = multi->stripes[0].dev;
154 eb->dev_bytenr = multi->stripes[0].physical;
156 ret = read_extent_from_disk(eb);
157 if (ret == 0 && check_tree_block(root, eb) == 0 &&
158 csum_tree_block(root, eb, 1) == 0) {
159 btrfs_set_buffer_uptodate(eb);
162 num_copies = btrfs_num_copies(&root->fs_info->mapping_tree,
164 if (num_copies == 1) {
/*
 * Use %llu with an explicit cast, as csum_tree_block() does: the 'L' length
 * modifier is only defined for floating-point conversions.
 */
165 printk("reading %llu failed only one copy\n", (unsigned long long)eb->start);
169 if (mirror_num > num_copies) {
170 printk("bailing at mirror %d of %d\n", mirror_num, num_copies);
174 free_extent_buffer(eb);
/*
 * Write a tree block to every stripe that its logical address maps to.
 * The block is checked with check_tree_block() and must be up to date; the
 * WRITTEN header flag is set and the checksum is refreshed before the
 * address is mapped for WRITE.  For each stripe the buffer's fd and
 * dev_bytenr are pointed at that stripe's device and the buffer is written.
 * The failure handling and the loop increment are not visible in this
 * excerpt.
 */
178 int write_tree_block(struct btrfs_trans_handle *trans, struct btrfs_root *root,
179 struct extent_buffer *eb)
184 struct btrfs_multi_bio *multi = NULL;
186 if (check_tree_block(root, eb))
188 if (!btrfs_buffer_uptodate(eb))
191 btrfs_set_header_flag(eb, BTRFS_HEADER_FLAG_WRITTEN);
/* Third argument 0: the other visible call site passes 1 when verifying. */
192 csum_tree_block(root, eb, 0);
196 ret = btrfs_map_block(&root->fs_info->mapping_tree, WRITE,
197 eb->start, &length, &multi, 0);
199 while(dev_nr < multi->num_stripes) {
201 eb->fd = multi->stripes[dev_nr].dev->fd;
202 eb->dev_bytenr = multi->stripes[dev_nr].physical;
/* Per-device I/O counter. */
203 multi->stripes[dev_nr].dev->total_ios++;
205 ret = write_extent_to_disk(eb);
/*
 * Initialize the in-memory fields of a btrfs_root: block geometry
 * (nodesize, leafsize, sectorsize, stripesize), owning fs_info, objectid,
 * zeroed counters, an empty dirty_list, and zeroed root_key/root_item with
 * root_key.objectid set to objectid.  Assignments on lines absent from this
 * excerpt (for example root->node) cannot be confirmed here.
 */
212 static int __setup_root(u32 nodesize, u32 leafsize, u32 sectorsize,
213 u32 stripesize, struct btrfs_root *root,
214 struct btrfs_fs_info *fs_info, u64 objectid)
217 root->commit_root = NULL;
218 root->sectorsize = sectorsize;
219 root->nodesize = nodesize;
220 root->leafsize = leafsize;
221 root->stripesize = stripesize;
223 root->track_dirty = 0;
225 root->fs_info = fs_info;
226 root->objectid = objectid;
227 root->last_trans = 0;
228 root->highest_inode = 0;
229 root->last_inode_alloc = 0;
231 INIT_LIST_HEAD(&root->dirty_list);
232 memset(&root->root_key, 0, sizeof(root->root_key));
233 memset(&root->root_item, 0, sizeof(root->root_item));
234 root->root_key.objectid = objectid;
/*
 * Bring a root's root_item in line with its current node and store it in
 * the tree root.  Dirty block groups are written first; the bytenr recorded
 * in root_item is compared with root->node->start, then the bytenr and
 * level in root_item are refreshed and btrfs_update_root() is called on
 * tree_root, followed by another block-group write.  Any enclosing loop and
 * the action taken when the bytenr is unchanged are not visible in this
 * excerpt.
 */
238 static int update_cowonly_root(struct btrfs_trans_handle *trans,
239 struct btrfs_root *root)
243 struct btrfs_root *tree_root = root->fs_info->tree_root;
245 btrfs_write_dirty_block_groups(trans, root);
247 old_root_bytenr = btrfs_root_bytenr(&root->root_item);
248 if (old_root_bytenr == root->node->start)
250 btrfs_set_root_bytenr(&root->root_item,
252 root->root_item.level = btrfs_header_level(root->node);
253 ret = btrfs_update_root(trans, tree_root,
257 btrfs_write_dirty_block_groups(trans, root);
/*
 * Process fs_info->dirty_cowonly_roots until the list is empty: take the
 * first entry, convert it to its btrfs_root through dirty_list, and call
 * update_cowonly_root() on it.  The statement that removes the entry from
 * the list is not visible in this excerpt.
 */
262 static int commit_tree_roots(struct btrfs_trans_handle *trans,
263 struct btrfs_fs_info *fs_info)
265 struct btrfs_root *root;
266 struct list_head *next;
268 while(!list_empty(&fs_info->dirty_cowonly_roots)) {
269 next = fs_info->dirty_cowonly_roots.next;
271 root = list_entry(next, struct btrfs_root, dirty_list);
/* The return value of update_cowonly_root() is not checked here. */
272 update_cowonly_root(trans, root);
/*
 * Write out extent buffers from root->fs_info->extent_cache.  A [start, end]
 * range is obtained with find_first_extent_bit() (the bit mask argument is
 * not visible in this excerpt); each buffer in the range is looked up,
 * written with write_tree_block(), has its dirty state cleared, and is
 * released.  The outer loop and the advance of start are not visible here.
 */
277 static int __commit_transaction(struct btrfs_trans_handle *trans,
278 struct btrfs_root *root)
282 struct extent_buffer *eb;
283 struct extent_io_tree *tree = &root->fs_info->extent_cache;
287 ret = find_first_extent_bit(tree, 0, &start, &end,
291 while(start <= end) {
292 eb = find_first_extent_buffer(tree, start);
/* A buffer must exist exactly at start; anything else is treated as fatal. */
293 BUG_ON(!eb || eb->start != start);
294 ret = write_tree_block(trans, root, eb);
297 clear_extent_buffer_dirty(eb);
/* Drops the reference taken by find_first_extent_buffer() - presumably; confirm. */
298 free_extent_buffer(eb);
/*
 * Commit a transaction for root.
 *
 * Visible steps, in order:
 *  - compare root->commit_root with root->node (the action taken on
 *    equality is not visible in this excerpt);
 *  - copy root into a heap-allocated new_root whose node is the old
 *    commit_root, and clear root->commit_root;
 *  - stamp root_key.offset with the transaction id, refresh root_item and
 *    insert it into the tree root;
 *  - set new_root's root_item refs to 0 and update it in the tree root;
 *  - commit cow-only roots, write dirty buffers, write the super block,
 *    finish the extent commit and free the transaction;
 *  - start a second transaction that drops the old snapshot (new_root),
 *    deletes its root item, and is committed the same way;
 *  - release root->commit_root and new_root->node.
 * Error checks after the individual calls, labels and the return statement
 * are not visible in this excerpt.
 */
304 int btrfs_commit_transaction(struct btrfs_trans_handle *trans,
305 struct btrfs_root *root)
308 struct btrfs_root *new_root = NULL;
309 struct btrfs_fs_info *fs_info = root->fs_info;
311 if (root->commit_root == root->node)
314 new_root = malloc(sizeof(*new_root));
/* new_root is a shallow copy of root that keeps the previous commit's node. */
317 memcpy(new_root, root, sizeof(*new_root));
318 new_root->node = root->commit_root;
319 root->commit_root = NULL;
321 root->root_key.offset = trans->transid;
322 btrfs_set_root_bytenr(&root->root_item, root->node->start);
323 root->root_item.level = btrfs_header_level(root->node);
324 ret = btrfs_insert_root(trans, fs_info->tree_root,
325 &root->root_key, &root->root_item);
328 btrfs_set_root_refs(&new_root->root_item, 0);
329 ret = btrfs_update_root(trans, root->fs_info->tree_root,
330 &new_root->root_key, &new_root->root_item);
333 ret = commit_tree_roots(trans, fs_info);
335 ret = __commit_transaction(trans, root);
337 write_ctree_super(trans, root);
338 btrfs_finish_extent_commit(trans, fs_info->extent_root,
339 &fs_info->pinned_extents);
340 btrfs_free_transaction(root, trans);
341 fs_info->running_transaction = NULL;
/* Second transaction: remove the superseded root copy. */
343 trans = btrfs_start_transaction(root, 1);
344 ret = btrfs_drop_snapshot(trans, new_root);
346 ret = btrfs_del_root(trans, fs_info->tree_root, &new_root->root_key);
349 ret = commit_tree_roots(trans, fs_info);
351 ret = __commit_transaction(trans, root);
353 write_ctree_super(trans, root);
354 btrfs_finish_extent_commit(trans, fs_info->extent_root,
355 &fs_info->pinned_extents);
356 btrfs_free_transaction(root, trans);
357 free_extent_buffer(root->commit_root);
358 root->commit_root = NULL;
359 fs_info->running_transaction = NULL;
361 free_extent_buffer(new_root->node);
/*
 * Initialize root with the tree root's block geometry, load the last root
 * item and key for objectid from tree_root via btrfs_find_last_root(), and
 * read the root node from the bytenr recorded in that item.  The block size
 * comes from btrfs_level_size() for the level stored in the root item.
 * Error checks and the return statement are not visible in this excerpt.
 */
367 static int find_and_setup_root(struct btrfs_root *tree_root,
368 struct btrfs_fs_info *fs_info,
369 u64 objectid, struct btrfs_root *root)
374 __setup_root(tree_root->nodesize, tree_root->leafsize,
375 tree_root->sectorsize, tree_root->stripesize,
376 root, fs_info, objectid);
377 ret = btrfs_find_last_root(tree_root, objectid,
378 &root->root_item, &root->root_key);
381 blocksize = btrfs_level_size(root, btrfs_root_level(&root->root_item));
382 root->node = read_tree_block(root, btrfs_root_bytenr(&root->root_item),
/*
 * Release the extent buffers held by root: root->node, and
 * root->commit_root when it is set.  Whether the root structure itself is
 * freed is not visible in this excerpt.
 */
388 int btrfs_free_fs_root(struct btrfs_fs_info *fs_info, struct btrfs_root *root)
391 free_extent_buffer(root->node);
392 if (root->commit_root)
393 free_extent_buffer(root->commit_root);
/*
 * Allocate a btrfs_root and load it for the given key.
 *
 * When location->offset is (u64)-1 the root is filled in by
 * find_and_setup_root().  Otherwise the root is initialized with the tree
 * root's geometry, tree_root is searched for the exact key, the root item
 * is copied out of the leaf, and the key is copied from location.  The root
 * node is then read from the bytenr stored in the root item.
 * Returns ERR_PTR(-ENOMEM) on allocation failure (the failure test itself
 * is on a line not visible here); other error paths, the assignment of l,
 * and the final return are not visible in this excerpt.
 */
399 struct btrfs_root *btrfs_read_fs_root(struct btrfs_fs_info *fs_info,
400 struct btrfs_key *location)
402 struct btrfs_root *root;
403 struct btrfs_root *tree_root = fs_info->tree_root;
404 struct btrfs_path *path;
405 struct extent_buffer *l;
409 root = malloc(sizeof(*root));
411 return ERR_PTR(-ENOMEM);
412 memset(root, 0, sizeof(*root));
413 if (location->offset == (u64)-1) {
414 ret = find_and_setup_root(tree_root, fs_info,
415 location->objectid, root);
423 __setup_root(tree_root->nodesize, tree_root->leafsize,
424 tree_root->sectorsize, tree_root->stripesize,
425 root, fs_info, location->objectid);
427 path = btrfs_alloc_path();
/* Read-only lookup: no transaction handle is passed to the search. */
429 ret = btrfs_search_slot(NULL, tree_root, location, path, 0, 0);
/* Copy the on-disk root item at the found slot into root->root_item. */
436 read_extent_buffer(l, &root->root_item,
437 btrfs_item_ptr_offset(l, path->slots[0]),
438 sizeof(root->root_item));
439 memcpy(&root->root_key, location, sizeof(*location));
442 btrfs_release_path(root, path);
443 btrfs_free_path(path);
448 blocksize = btrfs_level_size(root, btrfs_root_level(&root->root_item));
449 root->node = read_tree_block(root, btrfs_root_bytenr(&root->root_item),
/*
 * Open filename read-write and hand the descriptor to open_ctree_fd().
 * NOTE(review): O_CREAT with mode 0600 means a non-existent path is created
 * as an empty file before scanning - confirm this is intended.
 * Handling of an open() failure is not visible in this excerpt.
 */
457 struct btrfs_root *open_ctree(const char *filename, u64 sb_bytenr)
461 fp = open(filename, O_CREAT | O_RDWR, 0600);
465 return open_ctree_fd(fp, filename, sb_bytenr);
/*
 * Open a filesystem from an already-open descriptor.
 *
 * Visible steps, in order: allocate the root structures and fs_info; scan
 * the device for a super block at sb_bytenr; scan for sibling devices when
 * more than one is reported; initialize fs_info and its trees and lists;
 * open the devices; read the super block and check its magic; take the block
 * geometry from the super block; read the system chunk array and the chunk
 * tree; read the tree root; then set up the extent, device and fs roots.
 * Error checks after most calls, the condition guarding the default
 * sb_bytenr, and the return statement are not visible in this excerpt.
 */
468 struct btrfs_root *open_ctree_fd(int fp, const char *path, u64 sb_bytenr)
/*
 * NOTE(review): no NULL checks on these allocations are visible in this
 * excerpt.
 */
475 struct btrfs_root *root = malloc(sizeof(struct btrfs_root));
476 struct btrfs_root *tree_root = malloc(sizeof(struct btrfs_root));
477 struct btrfs_root *extent_root = malloc(sizeof(struct btrfs_root));
478 struct btrfs_root *chunk_root = malloc(sizeof(struct btrfs_root));
479 struct btrfs_root *dev_root = malloc(sizeof(struct btrfs_root));
480 struct btrfs_fs_info *fs_info = malloc(sizeof(*fs_info));
482 struct btrfs_super_block *disk_super;
483 struct btrfs_fs_devices *fs_devices = NULL;
487 sb_bytenr = BTRFS_SUPER_INFO_OFFSET;
489 ret = btrfs_scan_one_device(fp, path, &fs_devices,
490 &total_devs, sb_bytenr);
493 fprintf(stderr, "No valid Btrfs found on %s\n", path);
496 fprintf(stderr, "found Btrfs on %s with %lu devices\n", path,
497 (unsigned long)total_devs);
/* Multi-device filesystem: look for the remaining members. */
499 if (total_devs != 1) {
500 ret = btrfs_scan_for_fsid(fs_devices, total_devs, 1);
/* Zero fs_info, then wire up the roots allocated above. */
504 memset(fs_info, 0, sizeof(*fs_info));
505 fs_info->fp = fs_devices->lowest_bdev;
506 fs_info->fs_root = root;
507 fs_info->tree_root = tree_root;
508 fs_info->extent_root = extent_root;
509 fs_info->chunk_root = chunk_root;
510 fs_info->dev_root = dev_root;
512 extent_io_tree_init(&fs_info->extent_cache);
513 extent_io_tree_init(&fs_info->free_space_cache);
514 extent_io_tree_init(&fs_info->block_group_cache);
515 extent_io_tree_init(&fs_info->pinned_extents);
516 extent_io_tree_init(&fs_info->pending_del);
517 extent_io_tree_init(&fs_info->extent_ins);
519 cache_tree_init(&fs_info->mapping_tree.cache_tree);
521 mutex_init(&fs_info->fs_mutex);
522 fs_info->fs_devices = fs_devices;
523 INIT_LIST_HEAD(&fs_info->dirty_cowonly_roots);
524 INIT_LIST_HEAD(&fs_info->space_info);
/*
 * Provisional 4096-byte geometry for the tree root; the real sizes are
 * copied from the super block further down.
 */
526 __setup_root(4096, 4096, 4096, 4096, tree_root,
527 fs_info, BTRFS_ROOT_TREE_OBJECTID);
529 ret = btrfs_open_devices(fs_devices, O_RDWR);
532 ret = btrfs_bootstrap_super_map(&fs_info->mapping_tree, fs_devices);
/* Read the super block directly from fs_devices->latest_bdev at sb_bytenr. */
534 fs_info->sb_buffer = btrfs_find_create_tree_block(tree_root, sb_bytenr,
536 BUG_ON(!fs_info->sb_buffer);
537 fs_info->sb_buffer->fd = fs_devices->latest_bdev;
538 fs_info->sb_buffer->dev_bytenr = sb_bytenr;
539 ret = read_extent_from_disk(fs_info->sb_buffer);
541 btrfs_set_buffer_uptodate(fs_info->sb_buffer);
/* Keep an in-memory copy of the super block and of the fsid. */
543 read_extent_buffer(fs_info->sb_buffer, &fs_info->super_copy, 0,
544 sizeof(fs_info->super_copy));
545 read_extent_buffer(fs_info->sb_buffer, fs_info->fsid,
546 (unsigned long)btrfs_super_fsid(fs_info->sb_buffer),
549 disk_super = &fs_info->super_copy;
/* Reject the device when the magic bytes do not match BTRFS_MAGIC. */
550 if (strncmp((char *)(&disk_super->magic), BTRFS_MAGIC,
551 sizeof(disk_super->magic))) {
552 printk("No valid btrfs found\n");
/* Replace the provisional geometry with the values from the super block. */
555 nodesize = btrfs_super_nodesize(disk_super);
556 leafsize = btrfs_super_leafsize(disk_super);
557 sectorsize = btrfs_super_sectorsize(disk_super);
558 stripesize = btrfs_super_stripesize(disk_super);
559 tree_root->nodesize = nodesize;
560 tree_root->leafsize = leafsize;
561 tree_root->sectorsize = sectorsize;
562 tree_root->stripesize = stripesize;
564 ret = btrfs_read_super_device(tree_root, fs_info->sb_buffer);
566 ret = btrfs_read_sys_array(tree_root);
/* The chunk tree is read before the tree root. */
568 blocksize = btrfs_level_size(tree_root,
569 btrfs_super_chunk_root_level(disk_super));
571 __setup_root(nodesize, leafsize, sectorsize, stripesize,
572 chunk_root, fs_info, BTRFS_CHUNK_TREE_OBJECTID);
574 chunk_root->node = read_tree_block(chunk_root,
575 btrfs_super_chunk_root(disk_super),
578 BUG_ON(!chunk_root->node);
580 read_extent_buffer(chunk_root->node, fs_info->chunk_tree_uuid,
581 (unsigned long)btrfs_header_chunk_tree_uuid(chunk_root->node),
584 ret = btrfs_read_chunk_tree(chunk_root);
587 blocksize = btrfs_level_size(tree_root,
588 btrfs_super_root_level(disk_super));
590 tree_root->node = read_tree_block(tree_root,
591 btrfs_super_root(disk_super),
593 BUG_ON(!tree_root->node);
/* Load the extent, device and fs roots out of the tree root. */
594 ret = find_and_setup_root(tree_root, fs_info,
595 BTRFS_EXTENT_TREE_OBJECTID, extent_root);
597 extent_root->track_dirty = 1;
599 ret = find_and_setup_root(tree_root, fs_info,
600 BTRFS_DEV_TREE_OBJECTID, dev_root);
602 dev_root->track_dirty = 1;
604 ret = find_and_setup_root(tree_root, fs_info,
605 BTRFS_FS_TREE_OBJECTID, root);
/* The running generation is one past the generation stored on disk. */
608 fs_info->generation = btrfs_super_generation(disk_super) + 1;
609 btrfs_read_block_groups(root);
611 fs_info->data_alloc_profile = (u64)-1;
612 fs_info->metadata_alloc_profile = (u64)-1;
613 fs_info->system_alloc_profile = fs_info->metadata_alloc_profile;
/*
 * Write the super block buffer once per device in
 * root->fs_info->fs_devices->devices.  For each device its type, id, sizes,
 * I/O alignment/width, sector size and uuid are stored into the device item
 * embedded in the super block; the buffer is then flagged WRITTEN,
 * checksummed and written at BTRFS_SUPER_INFO_OFFSET.  The assignment of
 * the target descriptor and the handling of ret are not visible in this
 * excerpt.
 */
618 int write_all_supers(struct btrfs_root *root)
620 struct list_head *cur;
621 struct list_head *head = &root->fs_info->fs_devices->devices;
622 struct btrfs_device *dev;
623 struct extent_buffer *sb;
624 struct btrfs_dev_item *dev_item;
627 sb = root->fs_info->sb_buffer;
/*
 * dev_item is an offset within the super block cast to a pointer, not a
 * dereferenceable address; it is only passed to the accessor helpers
 * together with sb.
 */
628 dev_item = (struct btrfs_dev_item *)offsetof(struct btrfs_super_block,
630 list_for_each(cur, head) {
631 dev = list_entry(cur, struct btrfs_device, dev_list);
632 btrfs_set_device_type(sb, dev_item, dev->type);
633 btrfs_set_device_id(sb, dev_item, dev->devid);
634 btrfs_set_device_total_bytes(sb, dev_item, dev->total_bytes);
635 btrfs_set_device_bytes_used(sb, dev_item, dev->bytes_used);
636 btrfs_set_device_io_align(sb, dev_item, dev->io_align);
637 btrfs_set_device_io_width(sb, dev_item, dev->io_width);
638 btrfs_set_device_sector_size(sb, dev_item, dev->sector_size);
639 write_extent_buffer(sb, dev->uuid,
640 (unsigned long)btrfs_device_uuid(dev_item),
643 sb->dev_bytenr = BTRFS_SUPER_INFO_OFFSET;
644 btrfs_set_header_flag(sb, BTRFS_HEADER_FLAG_WRITTEN);
/* The checksum is recomputed per device because the device item changed. */
645 csum_tree_block(root, sb, 0);
646 ret = write_extent_to_disk(sb);
/*
 * Refresh the in-memory super block copy and write it out.  The generation,
 * the tree root's bytenr and level, and the chunk root's bytenr and level
 * are stored into fs_info->super_copy; the copy is written into sb_buffer
 * at offset 0 and write_all_supers() is called.  A message is printed to
 * stderr on failure (the condition is on a line not visible here).  The
 * generation value passed and the return statement are not visible in this
 * excerpt.
 */
652 int write_ctree_super(struct btrfs_trans_handle *trans,
653 struct btrfs_root *root)
656 struct btrfs_root *tree_root = root->fs_info->tree_root;
657 struct btrfs_root *chunk_root = root->fs_info->chunk_root;
658 btrfs_set_super_generation(&root->fs_info->super_copy,
660 btrfs_set_super_root(&root->fs_info->super_copy,
661 tree_root->node->start);
662 btrfs_set_super_root_level(&root->fs_info->super_copy,
663 btrfs_header_level(tree_root->node));
664 btrfs_set_super_chunk_root(&root->fs_info->super_copy,
665 chunk_root->node->start);
666 btrfs_set_super_chunk_root_level(&root->fs_info->super_copy,
667 btrfs_header_level(chunk_root->node));
668 write_extent_buffer(root->fs_info->sb_buffer,
669 &root->fs_info->super_copy, 0,
670 sizeof(root->fs_info->super_copy));
671 ret = write_all_supers(root);
673 fprintf(stderr, "failed to write new super block err %d\n", ret);
/*
 * Walk fs_info->fs_devices->devices.
 * NOTE(review): the close() call is commented out, so the visible loop body
 * only looks up each device and releases nothing - confirm whether the
 * descriptors are closed elsewhere.
 */
677 static int close_all_devices(struct btrfs_fs_info *fs_info)
679 struct list_head *list;
680 struct list_head *next;
681 struct btrfs_device *device;
685 list = &fs_info->fs_devices->devices;
686 list_for_each(next, list) {
687 device = list_entry(next, struct btrfs_device, dev_list);
688 // close(device->fd);
/*
 * Shut down a filesystem opened with open_ctree()/open_ctree_fd().
 *
 * Visible steps, in order: commit a transaction; run a second pass of
 * commit_tree_roots() and __commit_transaction() and write the super block;
 * free the block groups; close fs_info->fp; release the root nodes, the
 * commit root and the super block buffer; clean up the extent io trees; and
 * free the root structures.  Checks on ret, the freeing of fs_info itself
 * and the return statement are not visible in this excerpt.
 */
693 int close_ctree(struct btrfs_root *root)
696 struct btrfs_trans_handle *trans;
697 struct btrfs_fs_info *fs_info = root->fs_info;
699 trans = btrfs_start_transaction(root, 1);
700 btrfs_commit_transaction(trans, root);
701 trans = btrfs_start_transaction(root, 1);
702 ret = commit_tree_roots(trans, root->fs_info);
704 ret = __commit_transaction(trans, root);
706 write_ctree_super(trans, root);
707 btrfs_free_transaction(root, trans);
708 btrfs_free_block_groups(root->fs_info);
709 close(root->fs_info->fp);
711 free_extent_buffer(root->node);
712 if (root->fs_info->extent_root->node)
713 free_extent_buffer(root->fs_info->extent_root->node);
714 if (root->fs_info->tree_root->node)
715 free_extent_buffer(root->fs_info->tree_root->node);
716 free_extent_buffer(root->commit_root);
717 free_extent_buffer(root->fs_info->sb_buffer);
/*
 * The two guards below must not end in ';': an empty statement there would
 * make the following free unconditional.
 */
719 if (root->fs_info->chunk_root->node)
720 free_extent_buffer(root->fs_info->chunk_root->node);
722 if (root->fs_info->dev_root->node)
723 free_extent_buffer(root->fs_info->dev_root->node);
725 close_all_devices(root->fs_info);
726 extent_io_tree_cleanup(&fs_info->extent_cache);
727 extent_io_tree_cleanup(&fs_info->free_space_cache);
728 extent_io_tree_cleanup(&fs_info->block_group_cache);
729 extent_io_tree_cleanup(&fs_info->pinned_extents);
730 extent_io_tree_cleanup(&fs_info->pending_del);
731 extent_io_tree_cleanup(&fs_info->extent_ins);
733 free(fs_info->tree_root);
734 free(fs_info->extent_root);
735 free(fs_info->fs_root);
736 free(fs_info->chunk_root);
737 free(fs_info->dev_root);
/*
 * Clear the dirty state of eb and return the result of
 * clear_extent_buffer_dirty().  trans and root are not referenced by the
 * visible body.
 */
743 int clean_tree_block(struct btrfs_trans_handle *trans, struct btrfs_root *root,
744 struct extent_buffer *eb)
746 return clear_extent_buffer_dirty(eb);
/*
 * Wait for writeback of eb.  The body is not visible in this excerpt;
 * presumably a no-op stub here, since other visible code writes buffers
 * with direct write_extent_to_disk() calls - confirm.
 */
749 int wait_on_tree_block_writeback(struct btrfs_root *root,
750 struct extent_buffer *eb)
/* Mark eb dirty by calling set_extent_buffer_dirty(). */
755 void btrfs_mark_buffer_dirty(struct extent_buffer *eb)
757 set_extent_buffer_dirty(eb);
/* Return the result of extent_buffer_uptodate() for eb. */
760 int btrfs_buffer_uptodate(struct extent_buffer *eb)
762 return extent_buffer_uptodate(eb);
/* Mark eb up to date and return the result of set_extent_buffer_uptodate(). */
765 int btrfs_set_buffer_uptodate(struct extent_buffer *eb)
767 return set_extent_buffer_uptodate(eb);