bcachefs: Verify fs hasn't been modified before going rw

author Kent Overstreet <kent.overstreet@gmail.com>

Fri, 22 Mar 2019 03:13:46 +0000 (23:13 -0400)

committer Kent Overstreet <kent.overstreet@linux.dev>

Sun, 22 Oct 2023 21:08:18 +0000 (17:08 -0400)
author Kent Overstreet <kent.overstreet@gmail.com>
Fri, 22 Mar 2019 03:13:46 +0000 (23:13 -0400)
committer Kent Overstreet <kent.overstreet@linux.dev>
Sun, 22 Oct 2023 21:08:18 +0000 (17:08 -0400)
diff --git a/fs/bcachefs/bcachefs.h b/fs/bcachefs/bcachefs.h

index 5eae18e92bd5bc781dce8dbda499a3782800d112..a815d7a488a6b5662b8be25cdf03c5fd70c8a6f2 100644 (file)
--- a/fs/bcachefs/bcachefs.h
+++ b/fs/bcachefs/bcachefs.h
@@ -390,6 +390,7 @@ struct bch_dev {
         char                    name[BDEVNAME_SIZE];
  
         struct bch_sb_handle    disk_sb;
+       struct bch_sb           *sb_read_scratch;
         int                     sb_write_error;
  
         struct bch_devs_mask    self;
diff --git a/fs/bcachefs/fs.c b/fs/bcachefs/fs.c

index 2f01d97470b19aa47281e590e4350092cffc2559..2a5a90b2a78179b81a1c85c982613265acc8e21d 100644 (file)
--- a/fs/bcachefs/fs.c
+++ b/fs/bcachefs/fs.c
@@ -1682,6 +1682,7 @@ static int bch2_remount(struct super_block *sb, int *flags, char *data)
                         ret = bch2_fs_read_write(c);
                         if (ret) {
                                 bch_err(c, "error going rw: %i", ret);
+                               mutex_unlock(&c->state_lock);
                                 return -EINVAL;
                         }
  
diff --git a/fs/bcachefs/recovery.c b/fs/bcachefs/recovery.c

index f7e3060428cf857fff6bfb38bbeec1d852abd28a..93c4d5887e8bfa5e44bb5eabbac0cebf609c87fa 100644 (file)
--- a/fs/bcachefs/recovery.c
+++ b/fs/bcachefs/recovery.c
@@ -107,10 +107,11 @@ static int journal_replay_entry_early(struct bch_fs *c,
  }
  
  static int verify_superblock_clean(struct bch_fs *c,
-                                  struct bch_sb_field_clean *clean,
+                                  struct bch_sb_field_clean **cleanp,
                                    struct jset *j)
  {
         unsigned i;
+       struct bch_sb_field_clean *clean = *cleanp;
         int ret = 0;
  
         if (!clean || !j)
@@ -120,11 +121,9 @@ static int verify_superblock_clean(struct bch_fs *c,
                         "superblock journal seq (%llu) doesn't match journal (%llu) after clean shutdown",
                         le64_to_cpu(clean->journal_seq),
                         le64_to_cpu(j->seq))) {
-               ret = bch2_fs_mark_dirty(c);
-               if (ret) {
-                       bch_err(c, "error going rw");
-                       return ret;
-               }
+               kfree(clean);
+               *cleanp = NULL;
+               return 0;
         }
  
         mustfix_fsck_err_on(j->read_clock != clean->read_clock, c,
@@ -236,7 +235,7 @@ int bch2_fs_recovery(struct bch_fs *c)
                 BUG_ON(ret);
         }
  
-       ret = verify_superblock_clean(c, clean, j);
+       ret = verify_superblock_clean(c, &clean, j);
         if (ret)
                 goto err;
  
@@ -430,7 +429,7 @@ int bch2_fs_initialize(struct bch_fs *c)
         bch2_journal_set_replay_done(&c->journal);
  
         err = "error going read write";
-       ret = bch2_fs_read_write_early(c);
+       ret = __bch2_fs_read_write(c, true);
         if (ret)
                 goto err;
  
diff --git a/fs/bcachefs/super-io.c b/fs/bcachefs/super-io.c

index dec6a737f44f2dd464a142b78a645eda35759bd5..f504743fff4deb04ad5d06691321d6cc90ea1b31 100644 (file)
--- a/fs/bcachefs/super-io.c
+++ b/fs/bcachefs/super-io.c
@@ -509,6 +509,8 @@ reread:
         if (bch2_crc_cmp(csum, sb->sb->csum))
                 return "bad checksum reading superblock";
  
+       sb->seq = le64_to_cpu(sb->sb->seq);
+
         return NULL;
  }
  
@@ -642,6 +644,25 @@ static void write_super_endio(struct bio *bio)
         percpu_ref_put(&ca->io_ref);
  }
  
+static void read_back_super(struct bch_fs *c, struct bch_dev *ca)
+{
+       struct bch_sb *sb = ca->disk_sb.sb;
+       struct bio *bio = ca->disk_sb.bio;
+
+       bio_reset(bio, ca->disk_sb.bdev, REQ_OP_READ|REQ_SYNC|REQ_META);
+       bio->bi_iter.bi_sector  = le64_to_cpu(sb->layout.sb_offset[0]);
+       bio->bi_iter.bi_size    = 4096;
+       bio->bi_end_io          = write_super_endio;
+       bio->bi_private         = ca;
+       bch2_bio_map(bio, ca->sb_read_scratch);
+
+       this_cpu_add(ca->io_done->sectors[READ][BCH_DATA_SB],
+                    bio_sectors(bio));
+
+       percpu_ref_get(&ca->io_ref);
+       closure_bio_submit(bio, &c->sb_write);
+}
+
  static void write_one_super(struct bch_fs *c, struct bch_dev *ca, unsigned idx)
  {
         struct bch_sb *sb = ca->disk_sb.sb;
@@ -669,7 +690,7 @@ static void write_one_super(struct bch_fs *c, struct bch_dev *ca, unsigned idx)
         closure_bio_submit(bio, &c->sb_write);
  }
  
-void bch2_write_super(struct bch_fs *c)
+int bch2_write_super(struct bch_fs *c)
  {
         struct closure *cl = &c->sb_write;
         struct bch_dev *ca;
@@ -677,6 +698,7 @@ void bch2_write_super(struct bch_fs *c)
         const char *err;
         struct bch_devs_mask sb_written;
         bool wrote, can_mount_without_written, can_mount_with_written;
+       int ret = 0;
  
         lockdep_assert_held(&c->sb_lock);
  
@@ -692,6 +714,7 @@ void bch2_write_super(struct bch_fs *c)
                 err = bch2_sb_validate(&ca->disk_sb);
                 if (err) {
                         bch2_fs_inconsistent(c, "sb invalid before write: %s", err);
+                       ret = -1;
                         goto out;
                 }
         }
@@ -705,10 +728,27 @@ void bch2_write_super(struct bch_fs *c)
                 ca->sb_write_error = 0;
         }
  
+       for_each_online_member(ca, c, i)
+               read_back_super(c, ca);
+       closure_sync(cl);
+
+       for_each_online_member(ca, c, i) {
+               if (!ca->sb_write_error &&
+                   ca->disk_sb.seq !=
+                   le64_to_cpu(ca->sb_read_scratch->seq)) {
+                       bch2_fs_fatal_error(c,
+                               "Superblock modified by another process");
+                       percpu_ref_put(&ca->io_ref);
+                       ret = -EROFS;
+                       goto out;
+               }
+       }
+
         do {
                 wrote = false;
                 for_each_online_member(ca, c, i)
-                       if (sb < ca->disk_sb.sb->layout.nr_superblocks) {
+                       if (!ca->sb_write_error &&
+                           sb < ca->disk_sb.sb->layout.nr_superblocks) {
                                 write_one_super(c, ca, sb);
                                 wrote = true;
                         }
@@ -716,9 +756,12 @@ void bch2_write_super(struct bch_fs *c)
                 sb++;
         } while (wrote);
  
-       for_each_online_member(ca, c, i)
+       for_each_online_member(ca, c, i) {
                 if (ca->sb_write_error)
                         __clear_bit(ca->dev_idx, sb_written.d);
+               else
+                       ca->disk_sb.seq = le64_to_cpu(ca->disk_sb.sb->seq);
+       }
  
         nr_wrote = dev_mask_nr(&sb_written);
  
@@ -741,13 +784,15 @@ void bch2_write_super(struct bch_fs *c)
          * written anything (new filesystem), we continue if we'd be able to
          * mount with the devices we did successfully write to:
          */
-       bch2_fs_fatal_err_on(!nr_wrote ||
-                            (can_mount_without_written &&
-                             !can_mount_with_written), c,
-               "Unable to write superblock to sufficient devices");
+       if (bch2_fs_fatal_err_on(!nr_wrote ||
+                                (can_mount_without_written &&
+                                 !can_mount_with_written), c,
+               "Unable to write superblock to sufficient devices"))
+               ret = -1;
  out:
         /* Make new options visible after they're persistent: */
         bch2_sb_update(c);
+       return ret;
  }
  
  /* BCH_SB_FIELD_journal: */
@@ -888,16 +933,20 @@ void bch2_sb_clean_renumber(struct bch_sb_field_clean *clean, int write)
  
  int bch2_fs_mark_dirty(struct bch_fs *c)
  {
+       int ret;
+
+       /*
+        * Unconditionally write superblock, to verify it hasn't changed before
+        * we go rw:
+        */
+
         mutex_lock(&c->sb_lock);
-       if (BCH_SB_CLEAN(c->disk_sb.sb) ||
-           (c->disk_sb.sb->compat[0] & (1ULL << BCH_COMPAT_FEAT_ALLOC_INFO))) {
-               SET_BCH_SB_CLEAN(c->disk_sb.sb, false);
-               c->disk_sb.sb->compat[0] &= ~(1ULL << BCH_COMPAT_FEAT_ALLOC_INFO);
-               bch2_write_super(c);
-       }
+       SET_BCH_SB_CLEAN(c->disk_sb.sb, false);
+       c->disk_sb.sb->compat[0] &= ~(1ULL << BCH_COMPAT_FEAT_ALLOC_INFO);
+       ret = bch2_write_super(c);
         mutex_unlock(&c->sb_lock);
  
-       return 0;
+       return ret;
  }
  
  struct jset_entry *
diff --git a/fs/bcachefs/super-io.h b/fs/bcachefs/super-io.h

index afc92d14c25490b8151695d618a9579c1f4f9867..31b8b8307ac3334c2d3f883727138cda788a7605 100644 (file)
--- a/fs/bcachefs/super-io.h
+++ b/fs/bcachefs/super-io.h
@@ -89,7 +89,7 @@ int bch2_sb_realloc(struct bch_sb_handle *, unsigned);
  const char *bch2_sb_validate(struct bch_sb_handle *);
  
  int bch2_read_super(const char *, struct bch_opts *, struct bch_sb_handle *);
-void bch2_write_super(struct bch_fs *);
+int bch2_write_super(struct bch_fs *);
  
  /* BCH_SB_FIELD_journal: */
  
diff --git a/fs/bcachefs/super.c b/fs/bcachefs/super.c

index 5364b95cfec90249cb48fcd985baf36572b09997..dd1496af9a06ba1008f328e0daf30842ff8b3dac 100644 (file)
--- a/fs/bcachefs/super.c
+++ b/fs/bcachefs/super.c
@@ -366,7 +366,7 @@ static int bch2_fs_read_write_late(struct bch_fs *c)
         return 0;
  }
  
-static int __bch2_fs_read_write(struct bch_fs *c, bool early)
+int __bch2_fs_read_write(struct bch_fs *c, bool early)
  {
         struct bch_dev *ca;
         unsigned i;
@@ -907,6 +907,7 @@ static void bch2_dev_free(struct bch_dev *ca)
         free_percpu(ca->io_done);
         bioset_exit(&ca->replica_set);
         bch2_dev_buckets_free(ca);
+       kfree(ca->sb_read_scratch);
  
         bch2_time_stats_exit(&ca->io_latency[WRITE]);
         bch2_time_stats_exit(&ca->io_latency[READ]);
@@ -1017,6 +1018,7 @@ static struct bch_dev *__bch2_dev_alloc(struct bch_fs *c,
                             0, GFP_KERNEL) ||
             percpu_ref_init(&ca->io_ref, bch2_dev_io_ref_complete,
                             PERCPU_REF_INIT_DEAD, GFP_KERNEL) ||
+           !(ca->sb_read_scratch = kmalloc(4096, GFP_KERNEL)) ||
             bch2_dev_buckets_alloc(c, ca) ||
             bioset_init(&ca->replica_set, 4,
                         offsetof(struct bch_write_bio, bio), 0) ||
diff --git a/fs/bcachefs/super.h b/fs/bcachefs/super.h

index 91df0d7293221d4eb44e091171d1ffdedb176f75..92ef3e7c8dc2a4ebbfd822045dd7b06bea7a6cca 100644 (file)
--- a/fs/bcachefs/super.h
+++ b/fs/bcachefs/super.h
@@ -218,6 +218,7 @@ struct bch_dev *bch2_dev_lookup(struct bch_fs *, const char *);
  bool bch2_fs_emergency_read_only(struct bch_fs *);
  void bch2_fs_read_only(struct bch_fs *);
  
+int __bch2_fs_read_write(struct bch_fs *, bool);
  int bch2_fs_read_write(struct bch_fs *);
  int bch2_fs_read_write_early(struct bch_fs *);
  
diff --git a/fs/bcachefs/super_types.h b/fs/bcachefs/super_types.h

index 04a15729a244ca98d6e94d66746e4de6286ee8bd..6d0168a73ee47d7d66a82006a058ef129820d300 100644 (file)
--- a/fs/bcachefs/super_types.h
+++ b/fs/bcachefs/super_types.h
@@ -12,6 +12,7 @@ struct bch_sb_handle {
         unsigned                have_layout:1;
         unsigned                have_bio:1;
         unsigned                fs_sb:1;
+       u64                     seq;
  };
  
  struct bch_devs_mask {
author	Kent Overstreet <kent.overstreet@gmail.com>
	Fri, 22 Mar 2019 03:13:46 +0000 (23:13 -0400)
committer	Kent Overstreet <kent.overstreet@linux.dev>
	Sun, 22 Oct 2023 21:08:18 +0000 (17:08 -0400)
fs/bcachefs/bcachefs.h		patch \| blob \| blame \| history
fs/bcachefs/fs.c		patch \| blob \| blame \| history
fs/bcachefs/recovery.c		patch \| blob \| blame \| history
fs/bcachefs/super-io.c		patch \| blob \| blame \| history
fs/bcachefs/super-io.h		patch \| blob \| blame \| history
fs/bcachefs/super.c		patch \| blob \| blame \| history
fs/bcachefs/super.h		patch \| blob \| blame \| history
fs/bcachefs/super_types.h		patch \| blob \| blame \| history