diff options
Diffstat (limited to 'c_src/cmd_dump.c')
-rw-r--r-- | c_src/cmd_dump.c | 372 |
1 files changed, 285 insertions, 87 deletions
diff --git a/c_src/cmd_dump.c b/c_src/cmd_dump.c index eb338858..08051802 100644 --- a/c_src/cmd_dump.c +++ b/c_src/cmd_dump.c @@ -14,71 +14,216 @@ #include "libbcachefs/btree_iter.h" #include "libbcachefs/error.h" #include "libbcachefs/extents.h" +#include "libbcachefs/journal_io.h" #include "libbcachefs/sb-members.h" #include "libbcachefs/super.h" -static void dump_usage(void) -{ - puts("bcachefs dump - dump filesystem metadata\n" - "Usage: bcachefs dump [OPTION]... <devices>\n" - "\n" - "Options:\n" - " -o output Output qcow2 image(s)\n" - " -f, --force Force; overwrite when needed\n" - " --nojournal Don't dump entire journal, just dirty entries\n" - " --noexcl Open devices with O_NOEXCL (not recommended)\n" - " -h, --help Display this help and exit\n" - "Report bugs to <linux-bcachefs@vger.kernel.org>"); -} +struct dump_dev { + ranges sb, journal, btree; +}; +typedef DARRAY(struct dump_dev) dump_devs; -static void dump_node(struct bch_fs *c, struct bch_dev *ca, struct bkey_s_c k, ranges *data) +static void dump_node(struct bch_fs *c, dump_devs *devs, struct bkey_s_c k) { struct bkey_ptrs_c ptrs = bch2_bkey_ptrs_c(k); + unsigned bytes = btree_ptr_sectors_written(k) << 9 ?: c->opts.btree_node_size; bkey_for_each_ptr(ptrs, ptr) - if (ptr->dev == ca->dev_idx) - range_add(data, ptr->offset << 9, c->opts.btree_node_size); + range_add(&devs->data[ptr->dev].btree, + ptr->offset << 9, bytes); } -static void dump_one_device(struct bch_fs *c, struct bch_dev *ca, int fd, - bool entire_journal) +static void get_sb_journal(struct bch_fs *c, struct bch_dev *ca, + bool entire_journal, + struct dump_dev *d) { struct bch_sb *sb = ca->disk_sb.sb; - ranges data = { 0 }; - unsigned i; - int ret; /* Superblock: */ - range_add(&data, BCH_SB_LAYOUT_SECTOR << 9, + range_add(&d->sb, BCH_SB_LAYOUT_SECTOR << 9, sizeof(struct bch_sb_layout)); - for (i = 0; i < sb->layout.nr_superblocks; i++) - range_add(&data, + for (unsigned i = 0; i < sb->layout.nr_superblocks; i++) + range_add(&d->sb, le64_to_cpu(sb->layout.sb_offset[i]) << 9, vstruct_bytes(sb)); /* Journal: */ - for (i = 0; i < ca->journal.nr; i++) + for (unsigned i = 0; i < ca->journal.nr; i++) if (entire_journal || ca->journal.bucket_seq[i] >= c->journal.last_seq_ondisk) { u64 bucket = ca->journal.buckets[i]; - range_add(&data, + range_add(&d->journal, bucket_bytes(ca) * bucket, bucket_bytes(ca)); } +} + +struct dump_opts { + char *out; + bool force; + bool sanitize; + bool entire_journal; + bool noexcl; +}; + +static void sanitize_key(struct bkey_packed *k, struct bkey_format *f, void *end, + bool *modified) +{ + struct bch_val *v = bkeyp_val(f, k); + unsigned len = min_t(unsigned, end - (void *) v, bkeyp_val_bytes(f, k)); + + switch (k->type) { + case KEY_TYPE_inline_data: { + struct bch_inline_data *d = container_of(v, struct bch_inline_data, v); + + memset(&d->data[0], 0, len - offsetof(struct bch_inline_data, data)); + *modified = true; + break; + } + case KEY_TYPE_indirect_inline_data: { + struct bch_indirect_inline_data *d = container_of(v, struct bch_indirect_inline_data, v); + + memset(&d->data[0], 0, len - offsetof(struct bch_indirect_inline_data, data)); + *modified = true; + break; + } + } +} + +static void sanitize_journal(struct bch_fs *c, void *buf, size_t len) +{ + struct bkey_format f = BKEY_FORMAT_CURRENT; + void *end = buf + len; + + while (len) { + struct jset *j = buf; + bool modified = false; + + if (le64_to_cpu(j->magic) != jset_magic(c)) + break; + + vstruct_for_each(j, i) { + if ((void *) i >= end) + break; + + if (!jset_entry_is_key(i)) + continue; + + jset_entry_for_each_key(i, k) { + if ((void *) k >= end) + break; + if (!k->k.u64s) + break; + sanitize_key(bkey_to_packed(k), &f, end, &modified); + } + } + + if (modified) { + memset(&j->csum, 0, sizeof(j->csum)); + SET_JSET_CSUM_TYPE(j, 0); + } + + unsigned b = min(len, vstruct_sectors(j, c->block_bits) << 9); + len -= b; + buf += b; + } +} + +static void sanitize_btree(struct bch_fs *c, void *buf, size_t len) +{ + void *end = buf + len; + bool first = true; + struct bkey_format f_current = BKEY_FORMAT_CURRENT; + struct bkey_format f; + u64 seq; + + while (len) { + unsigned sectors; + struct bset *i; + bool modified = false; + + if (first) { + struct btree_node *bn = buf; + + if (le64_to_cpu(bn->magic) != bset_magic(c)) + break; + + i = &bn->keys; + seq = bn->keys.seq; + f = bn->format; + + sectors = vstruct_sectors(bn, c->block_bits); + } else { + struct btree_node_entry *bne = buf; + + if (bne->keys.seq != seq) + break; + + i = &bne->keys; + sectors = vstruct_sectors(bne, c->block_bits); + } + + vstruct_for_each(i, k) { + if ((void *) k >= end) + break; + if (!k->u64s) + break; + + sanitize_key(k, bkey_packed(k) ? &f : &f_current, end, &modified); + } + + if (modified) { + if (first) { + struct btree_node *bn = buf; + memset(&bn->csum, 0, sizeof(bn->csum)); + } else { + struct btree_node_entry *bne = buf; + memset(&bne->csum, 0, sizeof(bne->csum)); + } + SET_BSET_CSUM_TYPE(i, 0); + } + + first = false; + + unsigned b = min(len, sectors << 9); + len -= b; + buf += b; + } +} + +static int dump_fs(struct bch_fs *c, struct dump_opts opts) +{ + if (opts.sanitize) + printf("Sanitizing inline data extents\n"); + + dump_devs devs = {}; + while (devs.nr < c->sb.nr_devices) + darray_push(&devs, (struct dump_dev) {}); + + down_read(&c->state_lock); + + unsigned nr_online = 0; + for_each_online_member(c, ca, 0) { + if (opts.sanitize && ca->mi.bucket_size % block_sectors(c)) + die("%s has unaligned buckets, cannot sanitize", ca->name); + + get_sb_journal(c, ca, opts.entire_journal, &devs.data[ca->dev_idx]); + nr_online++; + } - /* Btree: */ - for (i = 0; i < BTREE_ID_NR; i++) { - struct btree_trans *trans = bch2_trans_get(c); + bch_verbose(c, "walking metadata to dump"); + for (unsigned i = 0; i < BTREE_ID_NR; i++) { + CLASS(btree_trans, trans)(c); - ret = __for_each_btree_node(trans, iter, i, POS_MIN, 0, 1, 0, b, ({ + int ret = __for_each_btree_node(trans, iter, i, POS_MIN, 0, 1, 0, b, ({ struct btree_node_iter iter; struct bkey u; struct bkey_s_c k; for_each_btree_node_key_unpack(b, k, &iter, &u) - dump_node(c, ca, k, &data); + dump_node(c, &devs, k); 0; })); @@ -87,57 +232,135 @@ static void dump_one_device(struct bch_fs *c, struct bch_dev *ca, int fd, struct btree *b = bch2_btree_id_root(c, i)->b; if (!btree_node_fake(b)) - dump_node(c, ca, bkey_i_to_s_c(&b->key), &data); + dump_node(c, &devs, bkey_i_to_s_c(&b->key)); + } + + bch_verbose(c, "writing metadata image(s)"); + for_each_online_member(c, ca, 0) { + int flags = O_WRONLY|O_CREAT|O_TRUNC; + + if (!opts.force) + flags |= O_EXCL; + + char *path = nr_online > 1 + ? mprintf("%s.%u.qcow2", opts.out, ca->dev_idx) + : mprintf("%s.qcow2", opts.out); + int fd = xopen(path, flags, 0600); + free(path); + + struct qcow2_image img; + qcow2_image_init(&img, ca->disk_sb.bdev->bd_fd, fd, c->opts.block_size); + + struct dump_dev *d = &devs.data[ca->dev_idx]; + + qcow2_write_ranges(&img, &d->sb); + + if (!opts.sanitize) { + qcow2_write_ranges(&img, &d->journal); + qcow2_write_ranges(&img, &d->btree); + } else { + ranges_sort(&d->journal); + ranges_sort(&d->btree); + + u64 bucket_bytes = ca->mi.bucket_size << 9; + char *buf = xmalloc(bucket_bytes); - bch2_trans_put(trans); + darray_for_each(d->journal, r) { + u64 len = r->end - r->start; + BUG_ON(len > bucket_bytes); + + xpread(img.infd, buf, len, r->start); + sanitize_journal(c, buf, len); + qcow2_write_buf(&img, buf, len, r->start); + } + + darray_for_each(d->btree, r) { + u64 len = r->end - r->start; + BUG_ON(len > bucket_bytes); + + xpread(img.infd, buf, len, r->start); + sanitize_btree(c, buf, len); + qcow2_write_buf(&img, buf, len, r->start); + } + free(buf); + } + + qcow2_image_finish(&img); + xclose(fd); } - qcow2_write_image(ca->disk_sb.bdev->bd_fd, fd, &data, - max_t(unsigned, c->opts.btree_node_size / 8, block_bytes(c))); - darray_exit(&data); + up_read(&c->state_lock); + + bch2_fs_stop(c); + + darray_for_each(devs, d) { + darray_exit(&d->sb); + darray_exit(&d->journal); + darray_exit(&d->btree); + } + darray_exit(&devs); + return 0; +} + +static void dump_usage(void) +{ + puts("bcachefs dump - dump filesystem metadata\n" + "Usage: bcachefs dump [OPTION]... <devices>\n" + "\n" + "Options:\n" + " -o output Output qcow2 image(s)\n" + " -f, --force Force; overwrite when needed\n" + " -s, --sanitize Zero out inline data extents\n" + " --nojournal Don't dump entire journal, just dirty entries\n" + " --noexcl Open devices with O_NOEXCL (not recommended)\n" + " -v, --verbose\n" + " -h, --help Display this help and exit\n" + "Report bugs to <linux-bcachefs@vger.kernel.org>"); } int cmd_dump(int argc, char *argv[]) { static const struct option longopts[] = { { "force", no_argument, NULL, 'f' }, + { "sanitize", no_argument, NULL, 's' }, { "nojournal", no_argument, NULL, 'j' }, { "noexcl", no_argument, NULL, 'e' }, { "verbose", no_argument, NULL, 'v' }, { "help", no_argument, NULL, 'h' }, { NULL } }; - struct bch_opts opts = bch2_opts_empty(); - char *out = NULL; - unsigned nr_devices = 0; - bool force = false, entire_journal = true; - int fd, opt; - - opt_set(opts, direct_io, false); - opt_set(opts, read_only, true); - opt_set(opts, nochanges, true); - opt_set(opts, norecovery, true); - opt_set(opts, degraded, BCH_DEGRADED_very); - opt_set(opts, errors, BCH_ON_ERROR_continue); - opt_set(opts, fix_errors, FSCK_FIX_no); - - while ((opt = getopt_long(argc, argv, "o:fvh", + struct bch_opts fs_opts = bch2_opts_empty(); + struct dump_opts opts = { .entire_journal = true }; + int opt; + + opt_set(fs_opts, direct_io, false); + opt_set(fs_opts, read_only, true); + opt_set(fs_opts, nochanges, true); + opt_set(fs_opts, norecovery, true); + opt_set(fs_opts, degraded, BCH_DEGRADED_very); + opt_set(fs_opts, errors, BCH_ON_ERROR_continue); + opt_set(fs_opts, fix_errors, FSCK_FIX_no); + + while ((opt = getopt_long(argc, argv, "o:fsvh", longopts, NULL)) != -1) switch (opt) { case 'o': - out = optarg; + opts.out = optarg; break; case 'f': - force = true; + opts.force = true; + break; + case 's': + opts.sanitize = true; break; case 'j': - entire_journal = false; + opts.entire_journal = false; break; case 'e': - opt_set(opts, noexcl, true); + opt_set(fs_opts, noexcl, true); break; case 'v': - opt_set(opts, verbose, true); + opt_set(fs_opts, verbose, true); break; case 'h': dump_usage(); @@ -145,44 +368,19 @@ int cmd_dump(int argc, char *argv[]) } args_shift(optind); - if (!out) + if (!opts.out) die("Please supply output filename"); if (!argc) die("Please supply device(s) to check"); - darray_const_str devs = get_or_split_cmdline_devs(argc, argv); + darray_const_str dev_names = get_or_split_cmdline_devs(argc, argv); - struct bch_fs *c = bch2_fs_open(&devs, &opts); + struct bch_fs *c = bch2_fs_open(&dev_names, &fs_opts); if (IS_ERR(c)) die("error opening devices: %s", bch2_err_str(PTR_ERR(c))); - down_read(&c->state_lock); - - for_each_online_member(c, ca, 0) - nr_devices++; - - BUG_ON(!nr_devices); - - for_each_online_member(c, ca, 0) { - int flags = O_WRONLY|O_CREAT|O_TRUNC; - - if (!force) - flags |= O_EXCL; - - char *path = nr_devices > 1 - ? mprintf("%s.%u.qcow2", out, ca->dev_idx) - : mprintf("%s.qcow2", out); - fd = xopen(path, flags, 0600); - free(path); - - dump_one_device(c, ca, fd, entire_journal); - xclose(fd); - } - - up_read(&c->state_lock); - - bch2_fs_stop(c); - darray_exit(&devs); - return 0; + int ret = dump_fs(c, opts); + darray_exit(&dev_names); + return ret; } |