Linux 2.6.38-rc2
[linux-2.6-block.git] / fs / nilfs2 / super.c
CommitLineData
783f6184
RK
1/*
2 * super.c - NILFS module and super block management.
3 *
4 * Copyright (C) 2005-2008 Nippon Telegraph and Telephone Corporation.
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
19 *
20 * Written by Ryusuke Konishi <ryusuke@osrg.net>
21 */
22/*
23 * linux/fs/ext2/super.c
24 *
25 * Copyright (C) 1992, 1993, 1994, 1995
26 * Remy Card (card@masi.ibp.fr)
27 * Laboratoire MASI - Institut Blaise Pascal
28 * Universite Pierre et Marie Curie (Paris VI)
29 *
30 * from
31 *
32 * linux/fs/minix/inode.c
33 *
34 * Copyright (C) 1991, 1992 Linus Torvalds
35 *
36 * Big-endian to little-endian byte-swapping/bitmaps by
37 * David S. Miller (davem@caip.rutgers.edu), 1995
38 */
39
40#include <linux/module.h>
41#include <linux/string.h>
42#include <linux/slab.h>
43#include <linux/init.h>
44#include <linux/blkdev.h>
45#include <linux/parser.h>
46#include <linux/random.h>
47#include <linux/crc32.h>
783f6184
RK
48#include <linux/vfs.h>
49#include <linux/writeback.h>
b58a285b
JS
50#include <linux/seq_file.h>
51#include <linux/mount.h>
783f6184 52#include "nilfs.h"
8e656fd5 53#include "export.h"
783f6184
RK
54#include "mdt.h"
55#include "alloc.h"
05d0e94b
RK
56#include "btree.h"
57#include "btnode.h"
783f6184
RK
58#include "page.h"
59#include "cpfile.h"
60#include "ifile.h"
61#include "dat.h"
62#include "segment.h"
63#include "segbuf.h"
64
65MODULE_AUTHOR("NTT Corp.");
66MODULE_DESCRIPTION("A New Implementation of the Log-structured Filesystem "
67 "(NILFS)");
783f6184
RK
68MODULE_LICENSE("GPL");
69
abc0b50b 70static struct kmem_cache *nilfs_inode_cachep;
41c88bd7
LH
71struct kmem_cache *nilfs_transaction_cachep;
72struct kmem_cache *nilfs_segbuf_cachep;
73struct kmem_cache *nilfs_btree_path_cache;
74
5beb6e0b 75static int nilfs_setup_super(struct nilfs_sb_info *sbi, int is_mount);
783f6184 76static int nilfs_remount(struct super_block *sb, int *flags, char *data);
783f6184 77
c8a11c8a
RK
78static void nilfs_set_error(struct nilfs_sb_info *sbi)
79{
80 struct the_nilfs *nilfs = sbi->s_nilfs;
d26493b6 81 struct nilfs_super_block **sbp;
c8a11c8a
RK
82
83 down_write(&nilfs->ns_sem);
84 if (!(nilfs->ns_mount_state & NILFS_ERROR_FS)) {
85 nilfs->ns_mount_state |= NILFS_ERROR_FS;
b2ac86e1 86 sbp = nilfs_prepare_super(sbi, 0);
d26493b6
JS
87 if (likely(sbp)) {
88 sbp[0]->s_state |= cpu_to_le16(NILFS_ERROR_FS);
b2ac86e1
JS
89 if (sbp[1])
90 sbp[1]->s_state |= cpu_to_le16(NILFS_ERROR_FS);
91 nilfs_commit_super(sbi, NILFS_SB_COMMIT_ALL);
d26493b6 92 }
c8a11c8a
RK
93 }
94 up_write(&nilfs->ns_sem);
95}
96
783f6184
RK
97/**
98 * nilfs_error() - report failure condition on a filesystem
99 *
100 * nilfs_error() sets an ERROR_FS flag on the superblock as well as
101 * reporting an error message. It should be called when NILFS detects
102 * incoherences or defects of meta data on disk. As for sustainable
103 * errors such as a single-shot I/O error, nilfs_warning() or the printk()
104 * function should be used instead.
105 *
106 * The segment constructor must not call this function because it can
107 * kill itself.
108 */
109void nilfs_error(struct super_block *sb, const char *function,
110 const char *fmt, ...)
111{
112 struct nilfs_sb_info *sbi = NILFS_SB(sb);
b004a5eb 113 struct va_format vaf;
783f6184
RK
114 va_list args;
115
116 va_start(args, fmt);
b004a5eb
JP
117
118 vaf.fmt = fmt;
119 vaf.va = &args;
120
121 printk(KERN_CRIT "NILFS error (device %s): %s: %pV\n",
122 sb->s_id, function, &vaf);
123
783f6184
RK
124 va_end(args);
125
126 if (!(sb->s_flags & MS_RDONLY)) {
c8a11c8a 127 nilfs_set_error(sbi);
783f6184
RK
128
129 if (nilfs_test_opt(sbi, ERRORS_RO)) {
130 printk(KERN_CRIT "Remounting filesystem read-only\n");
131 sb->s_flags |= MS_RDONLY;
132 }
133 }
134
135 if (nilfs_test_opt(sbi, ERRORS_PANIC))
136 panic("NILFS (device %s): panic forced after error\n",
137 sb->s_id);
138}
139
140void nilfs_warning(struct super_block *sb, const char *function,
141 const char *fmt, ...)
142{
b004a5eb 143 struct va_format vaf;
783f6184
RK
144 va_list args;
145
146 va_start(args, fmt);
b004a5eb
JP
147
148 vaf.fmt = fmt;
149 vaf.va = &args;
150
151 printk(KERN_WARNING "NILFS warning (device %s): %s: %pV\n",
152 sb->s_id, function, &vaf);
153
783f6184
RK
154 va_end(args);
155}
156
783f6184 157
2879ed66 158struct inode *nilfs_alloc_inode(struct super_block *sb)
783f6184
RK
159{
160 struct nilfs_inode_info *ii;
161
162 ii = kmem_cache_alloc(nilfs_inode_cachep, GFP_NOFS);
163 if (!ii)
164 return NULL;
165 ii->i_bh = NULL;
166 ii->i_state = 0;
0e14a359 167 ii->i_cno = 0;
783f6184 168 ii->vfs_inode.i_version = 1;
2879ed66 169 nilfs_btnode_cache_init(&ii->i_btnode_cache, sb->s_bdi);
783f6184
RK
170 return &ii->vfs_inode;
171}
172
fa0d7e3d 173static void nilfs_i_callback(struct rcu_head *head)
783f6184 174{
fa0d7e3d 175 struct inode *inode = container_of(head, struct inode, i_rcu);
b91c9a97
RK
176 struct nilfs_mdt_info *mdi = NILFS_MDT(inode);
177
fa0d7e3d
NP
178 INIT_LIST_HEAD(&inode->i_dentry);
179
b91c9a97
RK
180 if (mdi) {
181 kfree(mdi->mi_bgl); /* kfree(NULL) is safe */
182 kfree(mdi);
183 }
783f6184
RK
184 kmem_cache_free(nilfs_inode_cachep, NILFS_I(inode));
185}
186
fa0d7e3d
NP
187void nilfs_destroy_inode(struct inode *inode)
188{
189 call_rcu(&inode->i_rcu, nilfs_i_callback);
190}
191
b2ac86e1 192static int nilfs_sync_super(struct nilfs_sb_info *sbi, int flag)
783f6184
RK
193{
194 struct the_nilfs *nilfs = sbi->s_nilfs;
195 int err;
783f6184 196
783f6184 197 retry:
e339ad31 198 set_buffer_dirty(nilfs->ns_sbh[0]);
87e99511
CH
199 if (nilfs_test_opt(sbi, BARRIER)) {
200 err = __sync_dirty_buffer(nilfs->ns_sbh[0],
f8c131f5 201 WRITE_SYNC | WRITE_FLUSH_FUA);
87e99511
CH
202 } else {
203 err = sync_dirty_buffer(nilfs->ns_sbh[0]);
783f6184 204 }
87e99511 205
e339ad31 206 if (unlikely(err)) {
783f6184
RK
207 printk(KERN_ERR
208 "NILFS: unable to write superblock (err=%d)\n", err);
e339ad31 209 if (err == -EIO && nilfs->ns_sbh[1]) {
b2ac86e1
JS
210 /*
211 * sbp[0] points to newer log than sbp[1],
212 * so copy sbp[0] to sbp[1] to take over sbp[0].
213 */
214 memcpy(nilfs->ns_sbp[1], nilfs->ns_sbp[0],
215 nilfs->ns_sbsize);
e339ad31
RK
216 nilfs_fall_back_super_block(nilfs);
217 goto retry;
218 }
219 } else {
220 struct nilfs_super_block *sbp = nilfs->ns_sbp[0];
221
b2ac86e1
JS
222 nilfs->ns_sbwcount++;
223
e339ad31
RK
224 /*
225 * The latest segment becomes trailable from the position
226 * written in superblock.
227 */
783f6184 228 clear_nilfs_discontinued(nilfs);
e339ad31
RK
229
230 /* update GC protection for recent segments */
231 if (nilfs->ns_sbh[1]) {
b2ac86e1 232 if (flag == NILFS_SB_COMMIT_ALL) {
e339ad31 233 set_buffer_dirty(nilfs->ns_sbh[1]);
b2ac86e1
JS
234 if (sync_dirty_buffer(nilfs->ns_sbh[1]) < 0)
235 goto out;
e339ad31 236 }
b2ac86e1
JS
237 if (le64_to_cpu(nilfs->ns_sbp[1]->s_last_cno) <
238 le64_to_cpu(nilfs->ns_sbp[0]->s_last_cno))
239 sbp = nilfs->ns_sbp[1];
e339ad31 240 }
783f6184 241
b2ac86e1
JS
242 spin_lock(&nilfs->ns_last_segment_lock);
243 nilfs->ns_prot_seq = le64_to_cpu(sbp->s_last_seq);
244 spin_unlock(&nilfs->ns_last_segment_lock);
245 }
246 out:
783f6184
RK
247 return err;
248}
249
60f46b7e
RK
250void nilfs_set_log_cursor(struct nilfs_super_block *sbp,
251 struct the_nilfs *nilfs)
252{
253 sector_t nfreeblocks;
254
255 /* nilfs->ns_sem must be locked by the caller. */
256 nilfs_count_free_blocks(nilfs, &nfreeblocks);
257 sbp->s_free_blocks_count = cpu_to_le64(nfreeblocks);
258
259 spin_lock(&nilfs->ns_last_segment_lock);
260 sbp->s_last_seq = cpu_to_le64(nilfs->ns_last_seq);
261 sbp->s_last_pseg = cpu_to_le64(nilfs->ns_last_pseg);
262 sbp->s_last_cno = cpu_to_le64(nilfs->ns_last_cno);
263 spin_unlock(&nilfs->ns_last_segment_lock);
264}
265
b2ac86e1
JS
266struct nilfs_super_block **nilfs_prepare_super(struct nilfs_sb_info *sbi,
267 int flip)
783f6184
RK
268{
269 struct the_nilfs *nilfs = sbi->s_nilfs;
e339ad31 270 struct nilfs_super_block **sbp = nilfs->ns_sbp;
783f6184 271
d26493b6 272 /* nilfs->ns_sem must be locked by the caller. */
34cb9b5c 273 if (sbp[0]->s_magic != cpu_to_le16(NILFS_SUPER_MAGIC)) {
d26493b6
JS
274 if (sbp[1] &&
275 sbp[1]->s_magic == cpu_to_le16(NILFS_SUPER_MAGIC)) {
b2ac86e1 276 memcpy(sbp[0], sbp[1], nilfs->ns_sbsize);
d26493b6 277 } else {
e339ad31
RK
278 printk(KERN_CRIT "NILFS: superblock broke on dev %s\n",
279 sbi->s_super->s_id);
d26493b6 280 return NULL;
e339ad31 281 }
b2ac86e1
JS
282 } else if (sbp[1] &&
283 sbp[1]->s_magic != cpu_to_le16(NILFS_SUPER_MAGIC)) {
284 memcpy(sbp[1], sbp[0], nilfs->ns_sbsize);
e339ad31 285 }
b2ac86e1
JS
286
287 if (flip && sbp[1])
288 nilfs_swap_super_block(nilfs);
289
d26493b6
JS
290 return sbp;
291}
292
b2ac86e1 293int nilfs_commit_super(struct nilfs_sb_info *sbi, int flag)
d26493b6
JS
294{
295 struct the_nilfs *nilfs = sbi->s_nilfs;
296 struct nilfs_super_block **sbp = nilfs->ns_sbp;
297 time_t t;
298
299 /* nilfs->ns_sem must be locked by the caller. */
e339ad31 300 t = get_seconds();
b2ac86e1 301 nilfs->ns_sbwtime = t;
e339ad31
RK
302 sbp[0]->s_wtime = cpu_to_le64(t);
303 sbp[0]->s_sum = 0;
304 sbp[0]->s_sum = cpu_to_le32(crc32_le(nilfs->ns_crc_seed,
305 (unsigned char *)sbp[0],
306 nilfs->ns_sbsize));
b2ac86e1
JS
307 if (flag == NILFS_SB_COMMIT_ALL && sbp[1]) {
308 sbp[1]->s_wtime = sbp[0]->s_wtime;
309 sbp[1]->s_sum = 0;
310 sbp[1]->s_sum = cpu_to_le32(crc32_le(nilfs->ns_crc_seed,
311 (unsigned char *)sbp[1],
312 nilfs->ns_sbsize));
e339ad31 313 }
e605f0a7 314 clear_nilfs_sb_dirty(nilfs);
b2ac86e1 315 return nilfs_sync_super(sbi, flag);
783f6184
RK
316}
317
7ecaa46c
RK
318/**
319 * nilfs_cleanup_super() - write filesystem state for cleanup
320 * @sbi: nilfs_sb_info to be unmounted or degraded to read-only
321 *
322 * This function restores state flags in the on-disk super block.
323 * This will set "clean" flag (i.e. NILFS_VALID_FS) unless the
324 * filesystem was not clean previously.
325 */
326int nilfs_cleanup_super(struct nilfs_sb_info *sbi)
327{
d26493b6 328 struct nilfs_super_block **sbp;
b2ac86e1 329 int flag = NILFS_SB_COMMIT;
d26493b6 330 int ret = -EIO;
7ecaa46c 331
b2ac86e1 332 sbp = nilfs_prepare_super(sbi, 0);
d26493b6
JS
333 if (sbp) {
334 sbp[0]->s_state = cpu_to_le16(sbi->s_nilfs->ns_mount_state);
b2ac86e1
JS
335 nilfs_set_log_cursor(sbp[0], sbi->s_nilfs);
336 if (sbp[1] && sbp[0]->s_last_cno == sbp[1]->s_last_cno) {
337 /*
338 * make the "clean" flag also to the opposite
339 * super block if both super blocks point to
340 * the same checkpoint.
341 */
342 sbp[1]->s_state = sbp[0]->s_state;
343 flag = NILFS_SB_COMMIT_ALL;
344 }
345 ret = nilfs_commit_super(sbi, flag);
d26493b6 346 }
7ecaa46c
RK
347 return ret;
348}
349
783f6184
RK
350static void nilfs_put_super(struct super_block *sb)
351{
352 struct nilfs_sb_info *sbi = NILFS_SB(sb);
353 struct the_nilfs *nilfs = sbi->s_nilfs;
354
355 nilfs_detach_segment_constructor(sbi);
356
357 if (!(sb->s_flags & MS_RDONLY)) {
358 down_write(&nilfs->ns_sem);
7ecaa46c 359 nilfs_cleanup_super(sbi);
783f6184
RK
360 up_write(&nilfs->ns_sem);
361 }
362
f1e89c86
RK
363 iput(nilfs->ns_sufile);
364 iput(nilfs->ns_cpfile);
365 iput(nilfs->ns_dat);
366
348fe8da 367 destroy_nilfs(nilfs);
783f6184
RK
368 sbi->s_super = NULL;
369 sb->s_fs_info = NULL;
f11459ad 370 kfree(sbi);
783f6184
RK
371}
372
783f6184
RK
373static int nilfs_sync_fs(struct super_block *sb, int wait)
374{
6233caa9
JS
375 struct nilfs_sb_info *sbi = NILFS_SB(sb);
376 struct the_nilfs *nilfs = sbi->s_nilfs;
d26493b6 377 struct nilfs_super_block **sbp;
783f6184
RK
378 int err = 0;
379
380 /* This function is called when super block should be written back */
381 if (wait)
382 err = nilfs_construct_segment(sb);
6233caa9
JS
383
384 down_write(&nilfs->ns_sem);
d26493b6 385 if (nilfs_sb_dirty(nilfs)) {
b2ac86e1
JS
386 sbp = nilfs_prepare_super(sbi, nilfs_sb_will_flip(nilfs));
387 if (likely(sbp)) {
388 nilfs_set_log_cursor(sbp[0], nilfs);
389 nilfs_commit_super(sbi, NILFS_SB_COMMIT);
390 }
d26493b6 391 }
6233caa9
JS
392 up_write(&nilfs->ns_sem);
393
783f6184
RK
394 return err;
395}
396
4d8d9293
RK
397int nilfs_attach_checkpoint(struct nilfs_sb_info *sbi, __u64 cno, int curr_mnt,
398 struct nilfs_root **rootp)
783f6184
RK
399{
400 struct the_nilfs *nilfs = sbi->s_nilfs;
4d8d9293 401 struct nilfs_root *root;
783f6184
RK
402 struct nilfs_checkpoint *raw_cp;
403 struct buffer_head *bh_cp;
4d8d9293 404 int err = -ENOMEM;
783f6184 405
4d8d9293
RK
406 root = nilfs_find_or_create_root(
407 nilfs, curr_mnt ? NILFS_CPTREE_CURRENT_CNO : cno);
408 if (!root)
409 return err;
783f6184 410
e912a5b6
RK
411 if (root->ifile)
412 goto reuse; /* already attached checkpoint */
783f6184 413
1154ecbd 414 down_read(&nilfs->ns_segctor_sem);
783f6184
RK
415 err = nilfs_cpfile_get_checkpoint(nilfs->ns_cpfile, cno, 0, &raw_cp,
416 &bh_cp);
1154ecbd 417 up_read(&nilfs->ns_segctor_sem);
783f6184
RK
418 if (unlikely(err)) {
419 if (err == -ENOENT || err == -EINVAL) {
420 printk(KERN_ERR
421 "NILFS: Invalid checkpoint "
422 "(checkpoint number=%llu)\n",
423 (unsigned long long)cno);
424 err = -EINVAL;
425 }
426 goto failed;
427 }
f1e89c86
RK
428
429 err = nilfs_ifile_read(sbi->s_super, root, nilfs->ns_inode_size,
430 &raw_cp->cp_ifile_inode, &root->ifile);
431 if (err)
783f6184 432 goto failed_bh;
b7c06342
RK
433
434 atomic_set(&root->inodes_count, le64_to_cpu(raw_cp->cp_inodes_count));
435 atomic_set(&root->blocks_count, le64_to_cpu(raw_cp->cp_blocks_count));
783f6184
RK
436
437 nilfs_cpfile_put_checkpoint(nilfs->ns_cpfile, cno, bh_cp);
4d8d9293 438
e912a5b6 439 reuse:
4d8d9293 440 *rootp = root;
783f6184
RK
441 return 0;
442
443 failed_bh:
444 nilfs_cpfile_put_checkpoint(nilfs->ns_cpfile, cno, bh_cp);
445 failed:
4d8d9293 446 nilfs_put_root(root);
783f6184
RK
447
448 return err;
449}
783f6184 450
5beb6e0b
RK
451static int nilfs_freeze(struct super_block *sb)
452{
453 struct nilfs_sb_info *sbi = NILFS_SB(sb);
454 struct the_nilfs *nilfs = sbi->s_nilfs;
455 int err;
456
457 if (sb->s_flags & MS_RDONLY)
458 return 0;
783f6184 459
5beb6e0b
RK
460 /* Mark super block clean */
461 down_write(&nilfs->ns_sem);
462 err = nilfs_cleanup_super(sbi);
463 up_write(&nilfs->ns_sem);
783f6184
RK
464 return err;
465}
466
5beb6e0b 467static int nilfs_unfreeze(struct super_block *sb)
783f6184 468{
5beb6e0b 469 struct nilfs_sb_info *sbi = NILFS_SB(sb);
783f6184
RK
470 struct the_nilfs *nilfs = sbi->s_nilfs;
471
5beb6e0b
RK
472 if (sb->s_flags & MS_RDONLY)
473 return 0;
474
475 down_write(&nilfs->ns_sem);
476 nilfs_setup_super(sbi, false);
477 up_write(&nilfs->ns_sem);
478 return 0;
783f6184
RK
479}
480
783f6184
RK
481static int nilfs_statfs(struct dentry *dentry, struct kstatfs *buf)
482{
483 struct super_block *sb = dentry->d_sb;
b7c06342
RK
484 struct nilfs_root *root = NILFS_I(dentry->d_inode)->i_root;
485 struct the_nilfs *nilfs = root->nilfs;
c306af23 486 u64 id = huge_encode_dev(sb->s_bdev->bd_dev);
783f6184
RK
487 unsigned long long blocks;
488 unsigned long overhead;
489 unsigned long nrsvblocks;
490 sector_t nfreeblocks;
783f6184
RK
491 int err;
492
493 /*
494 * Compute all of the segment blocks
495 *
496 * The blocks before first segment and after last segment
497 * are excluded.
498 */
499 blocks = nilfs->ns_blocks_per_segment * nilfs->ns_nsegments
500 - nilfs->ns_first_data_block;
501 nrsvblocks = nilfs->ns_nrsvsegs * nilfs->ns_blocks_per_segment;
502
503 /*
504 * Compute the overhead
505 *
7a65004b 506 * When distributing meta data blocks outside segment structure,
783f6184
RK
507 * We must count them as the overhead.
508 */
509 overhead = 0;
510
511 err = nilfs_count_free_blocks(nilfs, &nfreeblocks);
512 if (unlikely(err))
513 return err;
514
515 buf->f_type = NILFS_SUPER_MAGIC;
516 buf->f_bsize = sb->s_blocksize;
517 buf->f_blocks = blocks - overhead;
518 buf->f_bfree = nfreeblocks;
519 buf->f_bavail = (buf->f_bfree >= nrsvblocks) ?
520 (buf->f_bfree - nrsvblocks) : 0;
b7c06342 521 buf->f_files = atomic_read(&root->inodes_count);
783f6184
RK
522 buf->f_ffree = 0; /* nilfs_count_free_inodes(sb); */
523 buf->f_namelen = NILFS_NAME_LEN;
c306af23
RK
524 buf->f_fsid.val[0] = (u32)id;
525 buf->f_fsid.val[1] = (u32)(id >> 32);
526
783f6184
RK
527 return 0;
528}
529
b58a285b
JS
530static int nilfs_show_options(struct seq_file *seq, struct vfsmount *vfs)
531{
532 struct super_block *sb = vfs->mnt_sb;
533 struct nilfs_sb_info *sbi = NILFS_SB(sb);
f11459ad 534 struct nilfs_root *root = NILFS_I(vfs->mnt_root->d_inode)->i_root;
b58a285b
JS
535
536 if (!nilfs_test_opt(sbi, BARRIER))
c6b4d57d 537 seq_puts(seq, ",nobarrier");
f11459ad
RK
538 if (root->cno != NILFS_CPTREE_CURRENT_CNO)
539 seq_printf(seq, ",cp=%llu", (unsigned long long)root->cno);
b58a285b 540 if (nilfs_test_opt(sbi, ERRORS_PANIC))
c6b4d57d 541 seq_puts(seq, ",errors=panic");
277a6a34 542 if (nilfs_test_opt(sbi, ERRORS_CONT))
c6b4d57d 543 seq_puts(seq, ",errors=continue");
b58a285b 544 if (nilfs_test_opt(sbi, STRICT_ORDER))
c6b4d57d 545 seq_puts(seq, ",order=strict");
0234576d 546 if (nilfs_test_opt(sbi, NORECOVERY))
c6b4d57d 547 seq_puts(seq, ",norecovery");
e902ec99 548 if (nilfs_test_opt(sbi, DISCARD))
c6b4d57d 549 seq_puts(seq, ",discard");
b58a285b
JS
550
551 return 0;
552}
553
b87221de 554static const struct super_operations nilfs_sops = {
783f6184
RK
555 .alloc_inode = nilfs_alloc_inode,
556 .destroy_inode = nilfs_destroy_inode,
557 .dirty_inode = nilfs_dirty_inode,
558 /* .write_inode = nilfs_write_inode, */
559 /* .put_inode = nilfs_put_inode, */
560 /* .drop_inode = nilfs_drop_inode, */
6fd1e5c9 561 .evict_inode = nilfs_evict_inode,
783f6184 562 .put_super = nilfs_put_super,
1dfa2710 563 /* .write_super = nilfs_write_super, */
783f6184 564 .sync_fs = nilfs_sync_fs,
5beb6e0b
RK
565 .freeze_fs = nilfs_freeze,
566 .unfreeze_fs = nilfs_unfreeze,
783f6184
RK
567 /* .write_super_lockfs */
568 /* .unlockfs */
569 .statfs = nilfs_statfs,
570 .remount_fs = nilfs_remount,
783f6184 571 /* .umount_begin */
b58a285b 572 .show_options = nilfs_show_options
783f6184
RK
573};
574
783f6184
RK
/* Mount option tokens returned by match_token() for the tokens[] table. */
enum {
	Opt_err_cont,		/* errors=continue */
	Opt_err_panic,		/* errors=panic */
	Opt_err_ro,		/* errors=remount-ro */
	Opt_barrier,		/* barrier */
	Opt_nobarrier,		/* nobarrier */
	Opt_snapshot,		/* cp=<number> */
	Opt_order,		/* order=<mode> */
	Opt_norecovery,		/* norecovery */
	Opt_discard,		/* discard */
	Opt_nodiscard,		/* nodiscard */
	Opt_err,		/* table terminator / unrecognized option */
};
580
581static match_table_t tokens = {
582 {Opt_err_cont, "errors=continue"},
583 {Opt_err_panic, "errors=panic"},
584 {Opt_err_ro, "errors=remount-ro"},
773bc4f3 585 {Opt_barrier, "barrier"},
91f1953b 586 {Opt_nobarrier, "nobarrier"},
783f6184
RK
587 {Opt_snapshot, "cp=%u"},
588 {Opt_order, "order=%s"},
0234576d 589 {Opt_norecovery, "norecovery"},
e902ec99 590 {Opt_discard, "discard"},
802d3177 591 {Opt_nodiscard, "nodiscard"},
783f6184
RK
592 {Opt_err, NULL}
593};
594
7c017457 595static int parse_options(char *options, struct super_block *sb, int is_remount)
783f6184
RK
596{
597 struct nilfs_sb_info *sbi = NILFS_SB(sb);
598 char *p;
599 substring_t args[MAX_OPT_ARGS];
783f6184
RK
600
601 if (!options)
602 return 1;
603
604 while ((p = strsep(&options, ",")) != NULL) {
605 int token;
606 if (!*p)
607 continue;
608
609 token = match_token(p, tokens, args);
610 switch (token) {
773bc4f3
RK
611 case Opt_barrier:
612 nilfs_set_opt(sbi, BARRIER);
613 break;
91f1953b
JS
614 case Opt_nobarrier:
615 nilfs_clear_opt(sbi, BARRIER);
783f6184
RK
616 break;
617 case Opt_order:
618 if (strcmp(args[0].from, "relaxed") == 0)
619 /* Ordered data semantics */
620 nilfs_clear_opt(sbi, STRICT_ORDER);
621 else if (strcmp(args[0].from, "strict") == 0)
622 /* Strict in-order semantics */
623 nilfs_set_opt(sbi, STRICT_ORDER);
624 else
625 return 0;
626 break;
627 case Opt_err_panic:
628 nilfs_write_opt(sbi, ERROR_MODE, ERRORS_PANIC);
629 break;
630 case Opt_err_ro:
631 nilfs_write_opt(sbi, ERROR_MODE, ERRORS_RO);
632 break;
633 case Opt_err_cont:
634 nilfs_write_opt(sbi, ERROR_MODE, ERRORS_CONT);
635 break;
636 case Opt_snapshot:
7c017457 637 if (is_remount) {
f11459ad
RK
638 printk(KERN_ERR
639 "NILFS: \"%s\" option is invalid "
640 "for remount.\n", p);
783f6184 641 return 0;
7c017457 642 }
783f6184 643 break;
0234576d
RK
644 case Opt_norecovery:
645 nilfs_set_opt(sbi, NORECOVERY);
646 break;
e902ec99
JS
647 case Opt_discard:
648 nilfs_set_opt(sbi, DISCARD);
649 break;
802d3177
RK
650 case Opt_nodiscard:
651 nilfs_clear_opt(sbi, DISCARD);
652 break;
783f6184
RK
653 default:
654 printk(KERN_ERR
655 "NILFS: Unrecognized mount option \"%s\"\n", p);
656 return 0;
657 }
658 }
659 return 1;
660}
661
662static inline void
663nilfs_set_default_options(struct nilfs_sb_info *sbi,
664 struct nilfs_super_block *sbp)
665{
666 sbi->s_mount_opt =
277a6a34 667 NILFS_MOUNT_ERRORS_RO | NILFS_MOUNT_BARRIER;
783f6184
RK
668}
669
5beb6e0b 670static int nilfs_setup_super(struct nilfs_sb_info *sbi, int is_mount)
783f6184
RK
671{
672 struct the_nilfs *nilfs = sbi->s_nilfs;
d26493b6
JS
673 struct nilfs_super_block **sbp;
674 int max_mnt_count;
675 int mnt_count;
676
677 /* nilfs->ns_sem must be locked by the caller. */
b2ac86e1 678 sbp = nilfs_prepare_super(sbi, 0);
d26493b6
JS
679 if (!sbp)
680 return -EIO;
681
5beb6e0b
RK
682 if (!is_mount)
683 goto skip_mount_setup;
684
d26493b6
JS
685 max_mnt_count = le16_to_cpu(sbp[0]->s_max_mnt_count);
686 mnt_count = le16_to_cpu(sbp[0]->s_mnt_count);
783f6184 687
f50a4c81 688 if (nilfs->ns_mount_state & NILFS_ERROR_FS) {
783f6184
RK
689 printk(KERN_WARNING
690 "NILFS warning: mounting fs with errors\n");
691#if 0
692 } else if (max_mnt_count >= 0 && mnt_count >= max_mnt_count) {
693 printk(KERN_WARNING
694 "NILFS warning: maximal mount count reached\n");
695#endif
696 }
697 if (!max_mnt_count)
d26493b6 698 sbp[0]->s_max_mnt_count = cpu_to_le16(NILFS_DFL_MAX_MNT_COUNT);
783f6184 699
d26493b6 700 sbp[0]->s_mnt_count = cpu_to_le16(mnt_count + 1);
5beb6e0b
RK
701 sbp[0]->s_mtime = cpu_to_le64(get_seconds());
702
703skip_mount_setup:
d26493b6
JS
704 sbp[0]->s_state =
705 cpu_to_le16(le16_to_cpu(sbp[0]->s_state) & ~NILFS_VALID_FS);
b2ac86e1
JS
706 /* synchronize sbp[1] with sbp[0] */
707 memcpy(sbp[1], sbp[0], nilfs->ns_sbsize);
708 return nilfs_commit_super(sbi, NILFS_SB_COMMIT_ALL);
783f6184
RK
709}
710
e339ad31
RK
711struct nilfs_super_block *nilfs_read_super_block(struct super_block *sb,
712 u64 pos, int blocksize,
713 struct buffer_head **pbh)
783f6184 714{
e339ad31
RK
715 unsigned long long sb_index = pos;
716 unsigned long offset;
783f6184 717
e339ad31 718 offset = do_div(sb_index, blocksize);
783f6184 719 *pbh = sb_bread(sb, sb_index);
e339ad31 720 if (!*pbh)
783f6184 721 return NULL;
783f6184
RK
722 return (struct nilfs_super_block *)((char *)(*pbh)->b_data + offset);
723}
724
783f6184
RK
725int nilfs_store_magic_and_option(struct super_block *sb,
726 struct nilfs_super_block *sbp,
727 char *data)
728{
729 struct nilfs_sb_info *sbi = NILFS_SB(sb);
730
783f6184
RK
731 sb->s_magic = le16_to_cpu(sbp->s_magic);
732
733 /* FS independent flags */
734#ifdef NILFS_ATIME_DISABLE
735 sb->s_flags |= MS_NOATIME;
736#endif
737
783f6184
RK
738 nilfs_set_default_options(sbi, sbp);
739
740 sbi->s_resuid = le16_to_cpu(sbp->s_def_resuid);
741 sbi->s_resgid = le16_to_cpu(sbp->s_def_resgid);
742 sbi->s_interval = le32_to_cpu(sbp->s_c_interval);
743 sbi->s_watermark = le32_to_cpu(sbp->s_c_block_max);
744
7c017457 745 return !parse_options(data, sb, 0) ? -EINVAL : 0 ;
783f6184
RK
746}
747
c5ca48aa
RK
748int nilfs_check_feature_compatibility(struct super_block *sb,
749 struct nilfs_super_block *sbp)
750{
751 __u64 features;
752
753 features = le64_to_cpu(sbp->s_feature_incompat) &
754 ~NILFS_FEATURE_INCOMPAT_SUPP;
755 if (features) {
756 printk(KERN_ERR "NILFS: couldn't mount because of unsupported "
757 "optional features (%llx)\n",
758 (unsigned long long)features);
759 return -EINVAL;
760 }
761 features = le64_to_cpu(sbp->s_feature_compat_ro) &
762 ~NILFS_FEATURE_COMPAT_RO_SUPP;
763 if (!(sb->s_flags & MS_RDONLY) && features) {
764 printk(KERN_ERR "NILFS: couldn't mount RDWR because of "
765 "unsupported optional features (%llx)\n",
766 (unsigned long long)features);
767 return -EINVAL;
768 }
769 return 0;
770}
771
367ea334
RK
772static int nilfs_get_root_dentry(struct super_block *sb,
773 struct nilfs_root *root,
774 struct dentry **root_dentry)
775{
776 struct inode *inode;
777 struct dentry *dentry;
778 int ret = 0;
779
780 inode = nilfs_iget(sb, root, NILFS_ROOT_INO);
781 if (IS_ERR(inode)) {
782 printk(KERN_ERR "NILFS: get root inode failed\n");
783 ret = PTR_ERR(inode);
784 goto out;
785 }
786 if (!S_ISDIR(inode->i_mode) || !inode->i_blocks || !inode->i_size) {
787 iput(inode);
788 printk(KERN_ERR "NILFS: corrupt root inode.\n");
789 ret = -EINVAL;
790 goto out;
791 }
792
f11459ad
RK
793 if (root->cno == NILFS_CPTREE_CURRENT_CNO) {
794 dentry = d_find_alias(inode);
795 if (!dentry) {
796 dentry = d_alloc_root(inode);
797 if (!dentry) {
798 iput(inode);
799 ret = -ENOMEM;
800 goto failed_dentry;
801 }
802 } else {
803 iput(inode);
804 }
805 } else {
806 dentry = d_obtain_alias(inode);
807 if (IS_ERR(dentry)) {
808 ret = PTR_ERR(dentry);
809 goto failed_dentry;
810 }
367ea334
RK
811 }
812 *root_dentry = dentry;
813 out:
814 return ret;
f11459ad
RK
815
816 failed_dentry:
817 printk(KERN_ERR "NILFS: get root dentry failed\n");
818 goto out;
367ea334
RK
819}
820
ab4d8f7e
RK
821static int nilfs_attach_snapshot(struct super_block *s, __u64 cno,
822 struct dentry **root_dentry)
823{
824 struct the_nilfs *nilfs = NILFS_SB(s)->s_nilfs;
825 struct nilfs_root *root;
826 int ret;
827
828 down_read(&nilfs->ns_segctor_sem);
829 ret = nilfs_cpfile_is_snapshot(nilfs->ns_cpfile, cno);
830 up_read(&nilfs->ns_segctor_sem);
831 if (ret < 0) {
832 ret = (ret == -ENOENT) ? -EINVAL : ret;
833 goto out;
834 } else if (!ret) {
835 printk(KERN_ERR "NILFS: The specified checkpoint is "
836 "not a snapshot (checkpoint number=%llu).\n",
837 (unsigned long long)cno);
838 ret = -EINVAL;
839 goto out;
840 }
841
842 ret = nilfs_attach_checkpoint(NILFS_SB(s), cno, false, &root);
843 if (ret) {
844 printk(KERN_ERR "NILFS: error loading snapshot "
845 "(checkpoint number=%llu).\n",
846 (unsigned long long)cno);
847 goto out;
848 }
849 ret = nilfs_get_root_dentry(s, root, root_dentry);
850 nilfs_put_root(root);
851 out:
852 return ret;
853}
854
f11459ad
RK
855static int nilfs_tree_was_touched(struct dentry *root_dentry)
856{
b7ab39f6 857 return root_dentry->d_count > 1;
f11459ad
RK
858}
859
860/**
861 * nilfs_try_to_shrink_tree() - try to shrink dentries of a checkpoint
862 * @root_dentry: root dentry of the tree to be shrunk
863 *
864 * This function returns true if the tree was in-use.
865 */
866static int nilfs_try_to_shrink_tree(struct dentry *root_dentry)
867{
868 if (have_submounts(root_dentry))
869 return true;
870 shrink_dcache_parent(root_dentry);
871 return nilfs_tree_was_touched(root_dentry);
872}
873
032dbb3b
RK
874int nilfs_checkpoint_is_mounted(struct super_block *sb, __u64 cno)
875{
876 struct the_nilfs *nilfs = NILFS_SB(sb)->s_nilfs;
877 struct nilfs_root *root;
878 struct inode *inode;
879 struct dentry *dentry;
880 int ret;
881
882 if (cno < 0 || cno > nilfs->ns_cno)
883 return false;
884
885 if (cno >= nilfs_last_cno(nilfs))
886 return true; /* protect recent checkpoints */
887
888 ret = false;
889 root = nilfs_lookup_root(NILFS_SB(sb)->s_nilfs, cno);
890 if (root) {
891 inode = nilfs_ilookup(sb, root, NILFS_ROOT_INO);
892 if (inode) {
893 dentry = d_find_alias(inode);
894 if (dentry) {
895 if (nilfs_tree_was_touched(dentry))
896 ret = nilfs_try_to_shrink_tree(dentry);
897 dput(dentry);
898 }
899 iput(inode);
900 }
901 nilfs_put_root(root);
902 }
903 return ret;
904}
905
783f6184
RK
906/**
907 * nilfs_fill_super() - initialize a super block instance
908 * @sb: super_block
909 * @data: mount options
910 * @silent: silent mode flag
783f6184 911 *
aa7dfb89 912 * This function is called exclusively by nilfs->ns_mount_mutex.
783f6184
RK
913 * So, the recovery process is protected from other simultaneous mounts.
914 */
915static int
348fe8da 916nilfs_fill_super(struct super_block *sb, void *data, int silent)
783f6184 917{
348fe8da 918 struct the_nilfs *nilfs;
783f6184 919 struct nilfs_sb_info *sbi;
4d8d9293 920 struct nilfs_root *fsroot;
026a7d63 921 struct backing_dev_info *bdi;
783f6184
RK
922 __u64 cno;
923 int err;
924
925 sbi = kzalloc(sizeof(*sbi), GFP_KERNEL);
926 if (!sbi)
927 return -ENOMEM;
928
929 sb->s_fs_info = sbi;
348fe8da 930 sbi->s_super = sb;
783f6184 931
348fe8da
RK
932 nilfs = alloc_nilfs(sb->s_bdev);
933 if (!nilfs) {
934 err = -ENOMEM;
935 goto failed_sbi;
936 }
783f6184 937 sbi->s_nilfs = nilfs;
783f6184
RK
938
939 err = init_nilfs(nilfs, sbi, (char *)data);
940 if (err)
348fe8da 941 goto failed_nilfs;
783f6184
RK
942
943 spin_lock_init(&sbi->s_inode_lock);
944 INIT_LIST_HEAD(&sbi->s_dirty_files);
783f6184
RK
945
946 /*
947 * Following initialization is overlapped because
948 * nilfs_sb_info structure has been cleared at the beginning.
949 * But we reserve them to keep our interest and make ready
950 * for the future change.
951 */
952 get_random_bytes(&sbi->s_next_generation,
953 sizeof(sbi->s_next_generation));
954 spin_lock_init(&sbi->s_next_gen_lock);
955
956 sb->s_op = &nilfs_sops;
957 sb->s_export_op = &nilfs_export_ops;
958 sb->s_root = NULL;
61239230 959 sb->s_time_gran = 1;
026a7d63
RK
960
961 bdi = sb->s_bdev->bd_inode->i_mapping->backing_dev_info;
962 sb->s_bdi = bdi ? : &default_backing_dev_info;
783f6184 963
f50a4c81
RK
964 err = load_nilfs(nilfs, sbi);
965 if (err)
348fe8da 966 goto failed_nilfs;
f50a4c81 967
783f6184 968 cno = nilfs_last_cno(nilfs);
ab4d8f7e 969 err = nilfs_attach_checkpoint(sbi, cno, true, &fsroot);
783f6184 970 if (err) {
f11459ad
RK
971 printk(KERN_ERR "NILFS: error loading last checkpoint "
972 "(checkpoint number=%llu).\n", (unsigned long long)cno);
f1e89c86 973 goto failed_unload;
783f6184
RK
974 }
975
976 if (!(sb->s_flags & MS_RDONLY)) {
e912a5b6 977 err = nilfs_attach_segment_constructor(sbi, fsroot);
783f6184
RK
978 if (err)
979 goto failed_checkpoint;
980 }
981
367ea334
RK
982 err = nilfs_get_root_dentry(sb, fsroot, &sb->s_root);
983 if (err)
783f6184 984 goto failed_segctor;
783f6184 985
4d8d9293 986 nilfs_put_root(fsroot);
783f6184
RK
987
988 if (!(sb->s_flags & MS_RDONLY)) {
989 down_write(&nilfs->ns_sem);
5beb6e0b 990 nilfs_setup_super(sbi, true);
783f6184
RK
991 up_write(&nilfs->ns_sem);
992 }
993
783f6184
RK
994 return 0;
995
783f6184
RK
996 failed_segctor:
997 nilfs_detach_segment_constructor(sbi);
998
999 failed_checkpoint:
4d8d9293 1000 nilfs_put_root(fsroot);
783f6184 1001
f1e89c86
RK
1002 failed_unload:
1003 iput(nilfs->ns_sufile);
1004 iput(nilfs->ns_cpfile);
1005 iput(nilfs->ns_dat);
1006
348fe8da
RK
1007 failed_nilfs:
1008 destroy_nilfs(nilfs);
783f6184
RK
1009
1010 failed_sbi:
783f6184 1011 sb->s_fs_info = NULL;
f11459ad 1012 kfree(sbi);
783f6184
RK
1013 return err;
1014}
1015
1016static int nilfs_remount(struct super_block *sb, int *flags, char *data)
1017{
1018 struct nilfs_sb_info *sbi = NILFS_SB(sb);
783f6184
RK
1019 struct the_nilfs *nilfs = sbi->s_nilfs;
1020 unsigned long old_sb_flags;
06df0f99 1021 unsigned long old_mount_opt;
f11459ad 1022 int err;
783f6184
RK
1023
1024 old_sb_flags = sb->s_flags;
06df0f99 1025 old_mount_opt = sbi->s_mount_opt;
783f6184 1026
7c017457 1027 if (!parse_options(data, sb, 1)) {
783f6184
RK
1028 err = -EINVAL;
1029 goto restore_opts;
1030 }
1031 sb->s_flags = (sb->s_flags & ~MS_POSIXACL);
1032
d240e067 1033 err = -EINVAL;
783f6184 1034
0234576d
RK
1035 if (!nilfs_valid_fs(nilfs)) {
1036 printk(KERN_WARNING "NILFS (device %s): couldn't "
1037 "remount because the filesystem is in an "
1038 "incomplete recovery state.\n", sb->s_id);
0234576d
RK
1039 goto restore_opts;
1040 }
1041
783f6184
RK
1042 if ((*flags & MS_RDONLY) == (sb->s_flags & MS_RDONLY))
1043 goto out;
1044 if (*flags & MS_RDONLY) {
1045 /* Shutting down the segment constructor */
1046 nilfs_detach_segment_constructor(sbi);
1047 sb->s_flags |= MS_RDONLY;
1048
783f6184
RK
1049 /*
1050 * Remounting a valid RW partition RDONLY, so set
1051 * the RDONLY flag and then mark the partition as valid again.
1052 */
1053 down_write(&nilfs->ns_sem);
7ecaa46c 1054 nilfs_cleanup_super(sbi);
783f6184
RK
1055 up_write(&nilfs->ns_sem);
1056 } else {
c5ca48aa 1057 __u64 features;
e912a5b6 1058 struct nilfs_root *root;
c5ca48aa 1059
783f6184
RK
1060 /*
1061 * Mounting a RDONLY partition read-write, so reread and
1062 * store the current valid flag. (It may have been changed
1063 * by fsck since we originally mounted the partition.)
1064 */
c5ca48aa
RK
1065 down_read(&nilfs->ns_sem);
1066 features = le64_to_cpu(nilfs->ns_sbp[0]->s_feature_compat_ro) &
1067 ~NILFS_FEATURE_COMPAT_RO_SUPP;
1068 up_read(&nilfs->ns_sem);
1069 if (features) {
1070 printk(KERN_WARNING "NILFS (device %s): couldn't "
1071 "remount RDWR because of unsupported optional "
1072 "features (%llx)\n",
1073 sb->s_id, (unsigned long long)features);
1074 err = -EROFS;
1075 goto restore_opts;
1076 }
1077
783f6184 1078 sb->s_flags &= ~MS_RDONLY;
783f6184 1079
e912a5b6
RK
1080 root = NILFS_I(sb->s_root->d_inode)->i_root;
1081 err = nilfs_attach_segment_constructor(sbi, root);
783f6184 1082 if (err)
e59399d0 1083 goto restore_opts;
783f6184
RK
1084
1085 down_write(&nilfs->ns_sem);
5beb6e0b 1086 nilfs_setup_super(sbi, true);
783f6184 1087 up_write(&nilfs->ns_sem);
783f6184
RK
1088 }
1089 out:
1090 return 0;
1091
783f6184
RK
1092 restore_opts:
1093 sb->s_flags = old_sb_flags;
06df0f99 1094 sbi->s_mount_opt = old_mount_opt;
783f6184
RK
1095 return err;
1096}
1097
1098struct nilfs_super_data {
1099 struct block_device *bdev;
6dd47406 1100 struct nilfs_sb_info *sbi;
783f6184
RK
1101 __u64 cno;
1102 int flags;
1103};
1104
1105/**
1106 * nilfs_identify - pre-read mount options needed to identify mount instance
1107 * @data: mount options
1108 * @sd: nilfs_super_data
1109 */
1110static int nilfs_identify(char *data, struct nilfs_super_data *sd)
1111{
1112 char *p, *options = data;
1113 substring_t args[MAX_OPT_ARGS];
c05dbfc2 1114 int token;
783f6184
RK
1115 int ret = 0;
1116
1117 do {
1118 p = strsep(&options, ",");
1119 if (p != NULL && *p) {
1120 token = match_token(p, tokens, args);
1121 if (token == Opt_snapshot) {
c05dbfc2 1122 if (!(sd->flags & MS_RDONLY)) {
783f6184 1123 ret++;
c05dbfc2
RK
1124 } else {
1125 sd->cno = simple_strtoull(args[0].from,
1126 NULL, 0);
1127 /*
1128 * No need to see the end pointer;
1129 * match_token() has done syntax
1130 * checking.
1131 */
1132 if (sd->cno == 0)
1133 ret++;
783f6184
RK
1134 }
1135 }
1136 if (ret)
1137 printk(KERN_ERR
1138 "NILFS: invalid mount option: %s\n", p);
1139 }
1140 if (!options)
1141 break;
1142 BUG_ON(options == data);
1143 *(options - 1) = ',';
1144 } while (!ret);
1145 return ret;
1146}
1147
1148static int nilfs_set_bdev_super(struct super_block *s, void *data)
1149{
f11459ad 1150 s->s_bdev = data;
783f6184
RK
1151 s->s_dev = s->s_bdev->bd_dev;
1152 return 0;
1153}
1154
1155static int nilfs_test_bdev_super(struct super_block *s, void *data)
783f6184 1156{
f11459ad 1157 return (void *)s->s_bdev == data;
783f6184
RK
1158}
1159
e4c59d61
AV
1160static struct dentry *
1161nilfs_mount(struct file_system_type *fs_type, int flags,
1162 const char *dev_name, void *data)
783f6184
RK
1163{
1164 struct nilfs_super_data sd;
33c8e57c 1165 struct super_block *s;
d4d77629 1166 fmode_t mode = FMODE_READ | FMODE_EXCL;
f11459ad
RK
1167 struct dentry *root_dentry;
1168 int err, s_new = false;
783f6184 1169
13e90559
RK
1170 if (!(flags & MS_RDONLY))
1171 mode |= FMODE_WRITE;
1172
d4d77629 1173 sd.bdev = blkdev_get_by_path(dev_name, mode, fs_type);
d6d4c19c 1174 if (IS_ERR(sd.bdev))
e4c59d61 1175 return ERR_CAST(sd.bdev);
783f6184 1176
783f6184
RK
1177 sd.cno = 0;
1178 sd.flags = flags;
1179 if (nilfs_identify((char *)data, &sd)) {
1180 err = -EINVAL;
1181 goto failed;
1182 }
1183
6dd47406 1184 /*
5beb6e0b
RK
1185 * once the super is inserted into the list by sget, s_umount
1186 * will protect the lockfs code from trying to start a snapshot
1187 * while we are mounting
6dd47406 1188 */
5beb6e0b
RK
1189 mutex_lock(&sd.bdev->bd_fsfreeze_mutex);
1190 if (sd.bdev->bd_fsfreeze_count > 0) {
1191 mutex_unlock(&sd.bdev->bd_fsfreeze_mutex);
1192 err = -EBUSY;
1193 goto failed;
1194 }
f11459ad 1195 s = sget(fs_type, nilfs_test_bdev_super, nilfs_set_bdev_super, sd.bdev);
5beb6e0b 1196 mutex_unlock(&sd.bdev->bd_fsfreeze_mutex);
33c8e57c
RK
1197 if (IS_ERR(s)) {
1198 err = PTR_ERR(s);
348fe8da 1199 goto failed;
783f6184
RK
1200 }
1201
1202 if (!s->s_root) {
1203 char b[BDEVNAME_SIZE];
1204
f11459ad
RK
1205 s_new = true;
1206
33c8e57c 1207 /* New superblock instance created */
783f6184 1208 s->s_flags = flags;
4571b82c 1209 s->s_mode = mode;
783f6184
RK
1210 strlcpy(s->s_id, bdevname(sd.bdev, b), sizeof(s->s_id));
1211 sb_set_blocksize(s, block_size(sd.bdev));
1212
348fe8da 1213 err = nilfs_fill_super(s, data, flags & MS_SILENT ? 1 : 0);
783f6184 1214 if (err)
348fe8da 1215 goto failed_super;
783f6184
RK
1216
1217 s->s_flags |= MS_ACTIVE;
f11459ad
RK
1218 } else if (!sd.cno) {
1219 int busy = false;
1220
1221 if (nilfs_tree_was_touched(s->s_root)) {
1222 busy = nilfs_try_to_shrink_tree(s->s_root);
1223 if (busy && (flags ^ s->s_flags) & MS_RDONLY) {
1224 printk(KERN_ERR "NILFS: the device already "
1225 "has a %s mount.\n",
1226 (s->s_flags & MS_RDONLY) ?
1227 "read-only" : "read/write");
1228 err = -EBUSY;
1229 goto failed_super;
1230 }
1231 }
1232 if (!busy) {
1233 /*
1234 * Try remount to setup mount states if the current
1235 * tree is not mounted and only snapshots use this sb.
1236 */
1237 err = nilfs_remount(s, &flags, data);
1238 if (err)
1239 goto failed_super;
1240 }
783f6184
RK
1241 }
1242
f11459ad
RK
1243 if (sd.cno) {
1244 err = nilfs_attach_snapshot(s, sd.cno, &root_dentry);
348fe8da 1245 if (err)
f11459ad 1246 goto failed_super;
f11459ad
RK
1247 } else {
1248 root_dentry = dget(s->s_root);
783f6184
RK
1249 }
1250
f11459ad 1251 if (!s_new)
d4d77629 1252 blkdev_put(sd.bdev, mode);
783f6184 1253
e4c59d61 1254 return root_dentry;
783f6184 1255
f11459ad 1256 failed_super:
a95161aa 1257 deactivate_locked_super(s);
783f6184 1258
348fe8da
RK
1259 failed:
1260 if (!s_new)
d4d77629 1261 blkdev_put(sd.bdev, mode);
e4c59d61 1262 return ERR_PTR(err);
783f6184
RK
1263}
1264
783f6184
RK
1265struct file_system_type nilfs_fs_type = {
1266 .owner = THIS_MODULE,
1267 .name = "nilfs2",
e4c59d61 1268 .mount = nilfs_mount,
783f6184
RK
1269 .kill_sb = kill_block_super,
1270 .fs_flags = FS_REQUIRES_DEV,
1271};
1272
41c88bd7 1273static void nilfs_inode_init_once(void *obj)
783f6184 1274{
41c88bd7 1275 struct nilfs_inode_info *ii = obj;
783f6184 1276
41c88bd7
LH
1277 INIT_LIST_HEAD(&ii->i_dirty);
1278#ifdef CONFIG_NILFS_XATTR
1279 init_rwsem(&ii->xattr_sem);
1280#endif
1281 nilfs_btnode_cache_init_once(&ii->i_btnode_cache);
05d0e94b 1282 ii->i_bmap = &ii->i_bmap_data;
41c88bd7
LH
1283 inode_init_once(&ii->vfs_inode);
1284}
783f6184 1285
41c88bd7
LH
1286static void nilfs_segbuf_init_once(void *obj)
1287{
1288 memset(obj, 0, sizeof(struct nilfs_segment_buffer));
1289}
783f6184 1290
41c88bd7
LH
1291static void nilfs_destroy_cachep(void)
1292{
84cb0999 1293 if (nilfs_inode_cachep)
41c88bd7 1294 kmem_cache_destroy(nilfs_inode_cachep);
84cb0999 1295 if (nilfs_transaction_cachep)
41c88bd7 1296 kmem_cache_destroy(nilfs_transaction_cachep);
84cb0999 1297 if (nilfs_segbuf_cachep)
41c88bd7 1298 kmem_cache_destroy(nilfs_segbuf_cachep);
84cb0999 1299 if (nilfs_btree_path_cache)
41c88bd7
LH
1300 kmem_cache_destroy(nilfs_btree_path_cache);
1301}
783f6184 1302
41c88bd7
LH
1303static int __init nilfs_init_cachep(void)
1304{
1305 nilfs_inode_cachep = kmem_cache_create("nilfs2_inode_cache",
1306 sizeof(struct nilfs_inode_info), 0,
1307 SLAB_RECLAIM_ACCOUNT, nilfs_inode_init_once);
1308 if (!nilfs_inode_cachep)
1309 goto fail;
1310
1311 nilfs_transaction_cachep = kmem_cache_create("nilfs2_transaction_cache",
1312 sizeof(struct nilfs_transaction_info), 0,
1313 SLAB_RECLAIM_ACCOUNT, NULL);
1314 if (!nilfs_transaction_cachep)
1315 goto fail;
1316
1317 nilfs_segbuf_cachep = kmem_cache_create("nilfs2_segbuf_cache",
1318 sizeof(struct nilfs_segment_buffer), 0,
1319 SLAB_RECLAIM_ACCOUNT, nilfs_segbuf_init_once);
1320 if (!nilfs_segbuf_cachep)
1321 goto fail;
1322
1323 nilfs_btree_path_cache = kmem_cache_create("nilfs2_btree_path_cache",
1324 sizeof(struct nilfs_btree_path) * NILFS_BTREE_LEVEL_MAX,
1325 0, 0, NULL);
1326 if (!nilfs_btree_path_cache)
1327 goto fail;
783f6184
RK
1328
1329 return 0;
1330
41c88bd7
LH
1331fail:
1332 nilfs_destroy_cachep();
1333 return -ENOMEM;
1334}
1335
1336static int __init init_nilfs_fs(void)
1337{
1338 int err;
783f6184 1339
41c88bd7
LH
1340 err = nilfs_init_cachep();
1341 if (err)
1342 goto fail;
783f6184 1343
41c88bd7
LH
1344 err = register_filesystem(&nilfs_fs_type);
1345 if (err)
1346 goto free_cachep;
783f6184 1347
9f130263 1348 printk(KERN_INFO "NILFS version 2 loaded\n");
41c88bd7 1349 return 0;
783f6184 1350
41c88bd7
LH
1351free_cachep:
1352 nilfs_destroy_cachep();
1353fail:
783f6184
RK
1354 return err;
1355}
1356
1357static void __exit exit_nilfs_fs(void)
1358{
41c88bd7 1359 nilfs_destroy_cachep();
783f6184
RK
1360 unregister_filesystem(&nilfs_fs_type);
1361}
1362
1363module_init(init_nilfs_fs)
1364module_exit(exit_nilfs_fs)