]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blob - fs/ext2/super.c
UBUNTU: Ubuntu-4.13.0-45.50
[mirror_ubuntu-artful-kernel.git] / fs / ext2 / super.c
1 /*
2 * linux/fs/ext2/super.c
3 *
4 * Copyright (C) 1992, 1993, 1994, 1995
5 * Remy Card (card@masi.ibp.fr)
6 * Laboratoire MASI - Institut Blaise Pascal
7 * Universite Pierre et Marie Curie (Paris VI)
8 *
9 * from
10 *
11 * linux/fs/minix/inode.c
12 *
13 * Copyright (C) 1991, 1992 Linus Torvalds
14 *
15 * Big-endian to little-endian byte-swapping/bitmaps by
16 * David S. Miller (davem@caip.rutgers.edu), 1995
17 */
18
19 #include <linux/module.h>
20 #include <linux/string.h>
21 #include <linux/fs.h>
22 #include <linux/slab.h>
23 #include <linux/init.h>
24 #include <linux/blkdev.h>
25 #include <linux/parser.h>
26 #include <linux/random.h>
27 #include <linux/buffer_head.h>
28 #include <linux/exportfs.h>
29 #include <linux/vfs.h>
30 #include <linux/seq_file.h>
31 #include <linux/mount.h>
32 #include <linux/log2.h>
33 #include <linux/quotaops.h>
34 #include <linux/uaccess.h>
35 #include <linux/dax.h>
36 #include "ext2.h"
37 #include "xattr.h"
38 #include "acl.h"
39
40 static void ext2_write_super(struct super_block *sb);
41 static int ext2_remount (struct super_block * sb, int * flags, char * data);
42 static int ext2_statfs (struct dentry * dentry, struct kstatfs * buf);
43 static int ext2_sync_fs(struct super_block *sb, int wait);
44 static int ext2_freeze(struct super_block *sb);
45 static int ext2_unfreeze(struct super_block *sb);
46
47 void ext2_error(struct super_block *sb, const char *function,
48 const char *fmt, ...)
49 {
50 struct va_format vaf;
51 va_list args;
52 struct ext2_sb_info *sbi = EXT2_SB(sb);
53 struct ext2_super_block *es = sbi->s_es;
54
55 if (!(sb->s_flags & MS_RDONLY)) {
56 spin_lock(&sbi->s_lock);
57 sbi->s_mount_state |= EXT2_ERROR_FS;
58 es->s_state |= cpu_to_le16(EXT2_ERROR_FS);
59 spin_unlock(&sbi->s_lock);
60 ext2_sync_super(sb, es, 1);
61 }
62
63 va_start(args, fmt);
64
65 vaf.fmt = fmt;
66 vaf.va = &args;
67
68 printk(KERN_CRIT "EXT2-fs (%s): error: %s: %pV\n",
69 sb->s_id, function, &vaf);
70
71 va_end(args);
72
73 if (test_opt(sb, ERRORS_PANIC))
74 panic("EXT2-fs: panic from previous error\n");
75 if (test_opt(sb, ERRORS_RO)) {
76 ext2_msg(sb, KERN_CRIT,
77 "error: remounting filesystem read-only");
78 sb->s_flags |= MS_RDONLY;
79 }
80 }
81
82 void ext2_msg(struct super_block *sb, const char *prefix,
83 const char *fmt, ...)
84 {
85 struct va_format vaf;
86 va_list args;
87
88 va_start(args, fmt);
89
90 vaf.fmt = fmt;
91 vaf.va = &args;
92
93 printk("%sEXT2-fs (%s): %pV\n", prefix, sb->s_id, &vaf);
94
95 va_end(args);
96 }
97
98 /*
99 * This must be called with sbi->s_lock held.
100 */
101 void ext2_update_dynamic_rev(struct super_block *sb)
102 {
103 struct ext2_super_block *es = EXT2_SB(sb)->s_es;
104
105 if (le32_to_cpu(es->s_rev_level) > EXT2_GOOD_OLD_REV)
106 return;
107
108 ext2_msg(sb, KERN_WARNING,
109 "warning: updating to rev %d because of "
110 "new feature flag, running e2fsck is recommended",
111 EXT2_DYNAMIC_REV);
112
113 es->s_first_ino = cpu_to_le32(EXT2_GOOD_OLD_FIRST_INO);
114 es->s_inode_size = cpu_to_le16(EXT2_GOOD_OLD_INODE_SIZE);
115 es->s_rev_level = cpu_to_le32(EXT2_DYNAMIC_REV);
116 /* leave es->s_feature_*compat flags alone */
117 /* es->s_uuid will be set by e2fsck if empty */
118
119 /*
120 * The rest of the superblock fields should be zero, and if not it
121 * means they are likely already in use, so leave them alone. We
122 * can leave it up to e2fsck to clean up any inconsistencies there.
123 */
124 }
125
#ifdef CONFIG_QUOTA
static int ext2_quota_off(struct super_block *sb, int type);

/* Turn quotas off for every quota type, in ascending type order. */
static void ext2_quota_off_umount(struct super_block *sb)
{
	int qtype = 0;

	while (qtype < MAXQUOTAS) {
		ext2_quota_off(sb, qtype);
		qtype++;
	}
}
#else
/* Without quota support there is nothing to switch off. */
static inline void ext2_quota_off_umount(struct super_block *sb)
{
}
#endif
141
142 static void ext2_put_super (struct super_block * sb)
143 {
144 int db_count;
145 int i;
146 struct ext2_sb_info *sbi = EXT2_SB(sb);
147
148 ext2_quota_off_umount(sb);
149
150 if (sbi->s_ea_block_cache) {
151 ext2_xattr_destroy_cache(sbi->s_ea_block_cache);
152 sbi->s_ea_block_cache = NULL;
153 }
154 if (!(sb->s_flags & MS_RDONLY)) {
155 struct ext2_super_block *es = sbi->s_es;
156
157 spin_lock(&sbi->s_lock);
158 es->s_state = cpu_to_le16(sbi->s_mount_state);
159 spin_unlock(&sbi->s_lock);
160 ext2_sync_super(sb, es, 1);
161 }
162 db_count = sbi->s_gdb_count;
163 for (i = 0; i < db_count; i++)
164 if (sbi->s_group_desc[i])
165 brelse (sbi->s_group_desc[i]);
166 kfree(sbi->s_group_desc);
167 kfree(sbi->s_debts);
168 percpu_counter_destroy(&sbi->s_freeblocks_counter);
169 percpu_counter_destroy(&sbi->s_freeinodes_counter);
170 percpu_counter_destroy(&sbi->s_dirs_counter);
171 brelse (sbi->s_sbh);
172 sb->s_fs_info = NULL;
173 kfree(sbi->s_blockgroup_lock);
174 kfree(sbi);
175 }
176
177 static struct kmem_cache * ext2_inode_cachep;
178
179 static struct inode *ext2_alloc_inode(struct super_block *sb)
180 {
181 struct ext2_inode_info *ei;
182 ei = kmem_cache_alloc(ext2_inode_cachep, GFP_KERNEL);
183 if (!ei)
184 return NULL;
185 ei->i_block_alloc_info = NULL;
186 ei->vfs_inode.i_version = 1;
187 #ifdef CONFIG_QUOTA
188 memset(&ei->i_dquot, 0, sizeof(ei->i_dquot));
189 #endif
190
191 return &ei->vfs_inode;
192 }
193
194 static void ext2_i_callback(struct rcu_head *head)
195 {
196 struct inode *inode = container_of(head, struct inode, i_rcu);
197 kmem_cache_free(ext2_inode_cachep, EXT2_I(inode));
198 }
199
200 static void ext2_destroy_inode(struct inode *inode)
201 {
202 call_rcu(&inode->i_rcu, ext2_i_callback);
203 }
204
205 static void init_once(void *foo)
206 {
207 struct ext2_inode_info *ei = (struct ext2_inode_info *) foo;
208
209 rwlock_init(&ei->i_meta_lock);
210 #ifdef CONFIG_EXT2_FS_XATTR
211 init_rwsem(&ei->xattr_sem);
212 #endif
213 mutex_init(&ei->truncate_mutex);
214 #ifdef CONFIG_FS_DAX
215 init_rwsem(&ei->dax_sem);
216 #endif
217 inode_init_once(&ei->vfs_inode);
218 }
219
220 static int __init init_inodecache(void)
221 {
222 ext2_inode_cachep = kmem_cache_create("ext2_inode_cache",
223 sizeof(struct ext2_inode_info),
224 0, (SLAB_RECLAIM_ACCOUNT|
225 SLAB_MEM_SPREAD|SLAB_ACCOUNT),
226 init_once);
227 if (ext2_inode_cachep == NULL)
228 return -ENOMEM;
229 return 0;
230 }
231
232 static void destroy_inodecache(void)
233 {
234 /*
235 * Make sure all delayed rcu free inodes are flushed before we
236 * destroy cache.
237 */
238 rcu_barrier();
239 kmem_cache_destroy(ext2_inode_cachep);
240 }
241
242 static int ext2_show_options(struct seq_file *seq, struct dentry *root)
243 {
244 struct super_block *sb = root->d_sb;
245 struct ext2_sb_info *sbi = EXT2_SB(sb);
246 struct ext2_super_block *es = sbi->s_es;
247 unsigned long def_mount_opts;
248
249 spin_lock(&sbi->s_lock);
250 def_mount_opts = le32_to_cpu(es->s_default_mount_opts);
251
252 if (sbi->s_sb_block != 1)
253 seq_printf(seq, ",sb=%lu", sbi->s_sb_block);
254 if (test_opt(sb, MINIX_DF))
255 seq_puts(seq, ",minixdf");
256 if (test_opt(sb, GRPID))
257 seq_puts(seq, ",grpid");
258 if (!test_opt(sb, GRPID) && (def_mount_opts & EXT2_DEFM_BSDGROUPS))
259 seq_puts(seq, ",nogrpid");
260 if (!uid_eq(sbi->s_resuid, make_kuid(&init_user_ns, EXT2_DEF_RESUID)) ||
261 le16_to_cpu(es->s_def_resuid) != EXT2_DEF_RESUID) {
262 seq_printf(seq, ",resuid=%u",
263 from_kuid_munged(&init_user_ns, sbi->s_resuid));
264 }
265 if (!gid_eq(sbi->s_resgid, make_kgid(&init_user_ns, EXT2_DEF_RESGID)) ||
266 le16_to_cpu(es->s_def_resgid) != EXT2_DEF_RESGID) {
267 seq_printf(seq, ",resgid=%u",
268 from_kgid_munged(&init_user_ns, sbi->s_resgid));
269 }
270 if (test_opt(sb, ERRORS_RO)) {
271 int def_errors = le16_to_cpu(es->s_errors);
272
273 if (def_errors == EXT2_ERRORS_PANIC ||
274 def_errors == EXT2_ERRORS_CONTINUE) {
275 seq_puts(seq, ",errors=remount-ro");
276 }
277 }
278 if (test_opt(sb, ERRORS_CONT))
279 seq_puts(seq, ",errors=continue");
280 if (test_opt(sb, ERRORS_PANIC))
281 seq_puts(seq, ",errors=panic");
282 if (test_opt(sb, NO_UID32))
283 seq_puts(seq, ",nouid32");
284 if (test_opt(sb, DEBUG))
285 seq_puts(seq, ",debug");
286 if (test_opt(sb, OLDALLOC))
287 seq_puts(seq, ",oldalloc");
288
289 #ifdef CONFIG_EXT2_FS_XATTR
290 if (test_opt(sb, XATTR_USER))
291 seq_puts(seq, ",user_xattr");
292 if (!test_opt(sb, XATTR_USER) &&
293 (def_mount_opts & EXT2_DEFM_XATTR_USER)) {
294 seq_puts(seq, ",nouser_xattr");
295 }
296 #endif
297
298 #ifdef CONFIG_EXT2_FS_POSIX_ACL
299 if (test_opt(sb, POSIX_ACL))
300 seq_puts(seq, ",acl");
301 if (!test_opt(sb, POSIX_ACL) && (def_mount_opts & EXT2_DEFM_ACL))
302 seq_puts(seq, ",noacl");
303 #endif
304
305 if (test_opt(sb, NOBH))
306 seq_puts(seq, ",nobh");
307
308 #if defined(CONFIG_QUOTA)
309 if (sbi->s_mount_opt & EXT2_MOUNT_USRQUOTA)
310 seq_puts(seq, ",usrquota");
311
312 if (sbi->s_mount_opt & EXT2_MOUNT_GRPQUOTA)
313 seq_puts(seq, ",grpquota");
314 #endif
315
316 #ifdef CONFIG_FS_DAX
317 if (sbi->s_mount_opt & EXT2_MOUNT_XIP)
318 seq_puts(seq, ",xip");
319 if (sbi->s_mount_opt & EXT2_MOUNT_DAX)
320 seq_puts(seq, ",dax");
321 #endif
322
323 if (!test_opt(sb, RESERVATION))
324 seq_puts(seq, ",noreservation");
325
326 spin_unlock(&sbi->s_lock);
327 return 0;
328 }
329
#ifdef CONFIG_QUOTA
/* Quota I/O helpers; their definitions are not in this part of the file. */
static ssize_t ext2_quota_read(struct super_block *sb, int type,
			       char *data, size_t len, loff_t off);
static ssize_t ext2_quota_write(struct super_block *sb, int type,
				const char *data, size_t len, loff_t off);
static int ext2_quota_on(struct super_block *sb, int type, int format_id,
			 const struct path *path);

/* Return the dquot pointer array stored in the ext2 in-core inode. */
static struct dquot **ext2_get_dquots(struct inode *inode)
{
	struct ext2_inode_info *info = EXT2_I(inode);

	return info->i_dquot;
}

/* quotactl entry points: ext2 on/off hooks plus the generic dquot helpers */
static const struct quotactl_ops ext2_quotactl_ops = {
	.quota_on	= ext2_quota_on,
	.quota_off	= ext2_quota_off,
	.quota_sync	= dquot_quota_sync,
	.get_state	= dquot_get_state,
	.set_info	= dquot_set_dqinfo,
	.get_dqblk	= dquot_get_dqblk,
	.set_dqblk	= dquot_set_dqblk,
	.get_nextdqblk	= dquot_get_next_dqblk,
};
#endif
351
352 static const struct super_operations ext2_sops = {
353 .alloc_inode = ext2_alloc_inode,
354 .destroy_inode = ext2_destroy_inode,
355 .write_inode = ext2_write_inode,
356 .evict_inode = ext2_evict_inode,
357 .put_super = ext2_put_super,
358 .sync_fs = ext2_sync_fs,
359 .freeze_fs = ext2_freeze,
360 .unfreeze_fs = ext2_unfreeze,
361 .statfs = ext2_statfs,
362 .remount_fs = ext2_remount,
363 .show_options = ext2_show_options,
364 #ifdef CONFIG_QUOTA
365 .quota_read = ext2_quota_read,
366 .quota_write = ext2_quota_write,
367 .get_dquots = ext2_get_dquots,
368 #endif
369 };
370
371 static struct inode *ext2_nfs_get_inode(struct super_block *sb,
372 u64 ino, u32 generation)
373 {
374 struct inode *inode;
375
376 if (ino < EXT2_FIRST_INO(sb) && ino != EXT2_ROOT_INO)
377 return ERR_PTR(-ESTALE);
378 if (ino > le32_to_cpu(EXT2_SB(sb)->s_es->s_inodes_count))
379 return ERR_PTR(-ESTALE);
380
381 /*
382 * ext2_iget isn't quite right if the inode is currently unallocated!
383 * However ext2_iget currently does appropriate checks to handle stale
384 * inodes so everything is OK.
385 */
386 inode = ext2_iget(sb, ino);
387 if (IS_ERR(inode))
388 return ERR_CAST(inode);
389 if (generation && inode->i_generation != generation) {
390 /* we didn't find the right inode.. */
391 iput(inode);
392 return ERR_PTR(-ESTALE);
393 }
394 return inode;
395 }
396
397 static struct dentry *ext2_fh_to_dentry(struct super_block *sb, struct fid *fid,
398 int fh_len, int fh_type)
399 {
400 return generic_fh_to_dentry(sb, fid, fh_len, fh_type,
401 ext2_nfs_get_inode);
402 }
403
404 static struct dentry *ext2_fh_to_parent(struct super_block *sb, struct fid *fid,
405 int fh_len, int fh_type)
406 {
407 return generic_fh_to_parent(sb, fid, fh_len, fh_type,
408 ext2_nfs_get_inode);
409 }
410
411 static const struct export_operations ext2_export_ops = {
412 .fh_to_dentry = ext2_fh_to_dentry,
413 .fh_to_parent = ext2_fh_to_parent,
414 .get_parent = ext2_get_parent,
415 };
416
417 static unsigned long get_sb_block(void **data)
418 {
419 unsigned long sb_block;
420 char *options = (char *) *data;
421
422 if (!options || strncmp(options, "sb=", 3) != 0)
423 return 1; /* Default location */
424 options += 3;
425 sb_block = simple_strtoul(options, &options, 0);
426 if (*options && *options != ',') {
427 printk("EXT2-fs: Invalid sb specification: %s\n",
428 (char *) *data);
429 return 1;
430 }
431 if (*options == ',')
432 options++;
433 *data = (void *) options;
434 return sb_block;
435 }
436
/* Token identifiers for the mount option parser (see the tokens table). */
enum {
	Opt_bsd_df,
	Opt_minix_df,
	Opt_grpid,
	Opt_nogrpid,
	Opt_resgid,
	Opt_resuid,
	Opt_sb,
	Opt_err_cont,
	Opt_err_panic,
	Opt_err_ro,
	Opt_nouid32,
	Opt_nocheck,
	Opt_debug,
	Opt_oldalloc,
	Opt_orlov,
	Opt_nobh,
	Opt_user_xattr,
	Opt_nouser_xattr,
	Opt_acl,
	Opt_noacl,
	Opt_xip,
	Opt_dax,
	Opt_ignore,
	Opt_err,
	Opt_quota,
	Opt_usrquota,
	Opt_grpquota,
	Opt_reservation,
	Opt_noreservation
};
445
446 static const match_table_t tokens = {
447 {Opt_bsd_df, "bsddf"},
448 {Opt_minix_df, "minixdf"},
449 {Opt_grpid, "grpid"},
450 {Opt_grpid, "bsdgroups"},
451 {Opt_nogrpid, "nogrpid"},
452 {Opt_nogrpid, "sysvgroups"},
453 {Opt_resgid, "resgid=%u"},
454 {Opt_resuid, "resuid=%u"},
455 {Opt_sb, "sb=%u"},
456 {Opt_err_cont, "errors=continue"},
457 {Opt_err_panic, "errors=panic"},
458 {Opt_err_ro, "errors=remount-ro"},
459 {Opt_nouid32, "nouid32"},
460 {Opt_nocheck, "check=none"},
461 {Opt_nocheck, "nocheck"},
462 {Opt_debug, "debug"},
463 {Opt_oldalloc, "oldalloc"},
464 {Opt_orlov, "orlov"},
465 {Opt_nobh, "nobh"},
466 {Opt_user_xattr, "user_xattr"},
467 {Opt_nouser_xattr, "nouser_xattr"},
468 {Opt_acl, "acl"},
469 {Opt_noacl, "noacl"},
470 {Opt_xip, "xip"},
471 {Opt_dax, "dax"},
472 {Opt_grpquota, "grpquota"},
473 {Opt_ignore, "noquota"},
474 {Opt_quota, "quota"},
475 {Opt_usrquota, "usrquota"},
476 {Opt_reservation, "reservation"},
477 {Opt_noreservation, "noreservation"},
478 {Opt_err, NULL}
479 };
480
481 static int parse_options(char *options, struct super_block *sb)
482 {
483 char *p;
484 struct ext2_sb_info *sbi = EXT2_SB(sb);
485 substring_t args[MAX_OPT_ARGS];
486 int option;
487 kuid_t uid;
488 kgid_t gid;
489
490 if (!options)
491 return 1;
492
493 while ((p = strsep (&options, ",")) != NULL) {
494 int token;
495 if (!*p)
496 continue;
497
498 token = match_token(p, tokens, args);
499 switch (token) {
500 case Opt_bsd_df:
501 clear_opt (sbi->s_mount_opt, MINIX_DF);
502 break;
503 case Opt_minix_df:
504 set_opt (sbi->s_mount_opt, MINIX_DF);
505 break;
506 case Opt_grpid:
507 set_opt (sbi->s_mount_opt, GRPID);
508 break;
509 case Opt_nogrpid:
510 clear_opt (sbi->s_mount_opt, GRPID);
511 break;
512 case Opt_resuid:
513 if (match_int(&args[0], &option))
514 return 0;
515 uid = make_kuid(current_user_ns(), option);
516 if (!uid_valid(uid)) {
517 ext2_msg(sb, KERN_ERR, "Invalid uid value %d", option);
518 return 0;
519
520 }
521 sbi->s_resuid = uid;
522 break;
523 case Opt_resgid:
524 if (match_int(&args[0], &option))
525 return 0;
526 gid = make_kgid(current_user_ns(), option);
527 if (!gid_valid(gid)) {
528 ext2_msg(sb, KERN_ERR, "Invalid gid value %d", option);
529 return 0;
530 }
531 sbi->s_resgid = gid;
532 break;
533 case Opt_sb:
534 /* handled by get_sb_block() instead of here */
535 /* *sb_block = match_int(&args[0]); */
536 break;
537 case Opt_err_panic:
538 clear_opt (sbi->s_mount_opt, ERRORS_CONT);
539 clear_opt (sbi->s_mount_opt, ERRORS_RO);
540 set_opt (sbi->s_mount_opt, ERRORS_PANIC);
541 break;
542 case Opt_err_ro:
543 clear_opt (sbi->s_mount_opt, ERRORS_CONT);
544 clear_opt (sbi->s_mount_opt, ERRORS_PANIC);
545 set_opt (sbi->s_mount_opt, ERRORS_RO);
546 break;
547 case Opt_err_cont:
548 clear_opt (sbi->s_mount_opt, ERRORS_RO);
549 clear_opt (sbi->s_mount_opt, ERRORS_PANIC);
550 set_opt (sbi->s_mount_opt, ERRORS_CONT);
551 break;
552 case Opt_nouid32:
553 set_opt (sbi->s_mount_opt, NO_UID32);
554 break;
555 case Opt_nocheck:
556 clear_opt (sbi->s_mount_opt, CHECK);
557 break;
558 case Opt_debug:
559 set_opt (sbi->s_mount_opt, DEBUG);
560 break;
561 case Opt_oldalloc:
562 set_opt (sbi->s_mount_opt, OLDALLOC);
563 break;
564 case Opt_orlov:
565 clear_opt (sbi->s_mount_opt, OLDALLOC);
566 break;
567 case Opt_nobh:
568 set_opt (sbi->s_mount_opt, NOBH);
569 break;
570 #ifdef CONFIG_EXT2_FS_XATTR
571 case Opt_user_xattr:
572 set_opt (sbi->s_mount_opt, XATTR_USER);
573 break;
574 case Opt_nouser_xattr:
575 clear_opt (sbi->s_mount_opt, XATTR_USER);
576 break;
577 #else
578 case Opt_user_xattr:
579 case Opt_nouser_xattr:
580 ext2_msg(sb, KERN_INFO, "(no)user_xattr options"
581 "not supported");
582 break;
583 #endif
584 #ifdef CONFIG_EXT2_FS_POSIX_ACL
585 case Opt_acl:
586 set_opt(sbi->s_mount_opt, POSIX_ACL);
587 break;
588 case Opt_noacl:
589 clear_opt(sbi->s_mount_opt, POSIX_ACL);
590 break;
591 #else
592 case Opt_acl:
593 case Opt_noacl:
594 ext2_msg(sb, KERN_INFO,
595 "(no)acl options not supported");
596 break;
597 #endif
598 case Opt_xip:
599 ext2_msg(sb, KERN_INFO, "use dax instead of xip");
600 set_opt(sbi->s_mount_opt, XIP);
601 /* Fall through */
602 case Opt_dax:
603 #ifdef CONFIG_FS_DAX
604 ext2_msg(sb, KERN_WARNING,
605 "DAX enabled. Warning: EXPERIMENTAL, use at your own risk");
606 set_opt(sbi->s_mount_opt, DAX);
607 #else
608 ext2_msg(sb, KERN_INFO, "dax option not supported");
609 #endif
610 break;
611
612 #if defined(CONFIG_QUOTA)
613 case Opt_quota:
614 case Opt_usrquota:
615 set_opt(sbi->s_mount_opt, USRQUOTA);
616 break;
617
618 case Opt_grpquota:
619 set_opt(sbi->s_mount_opt, GRPQUOTA);
620 break;
621 #else
622 case Opt_quota:
623 case Opt_usrquota:
624 case Opt_grpquota:
625 ext2_msg(sb, KERN_INFO,
626 "quota operations not supported");
627 break;
628 #endif
629
630 case Opt_reservation:
631 set_opt(sbi->s_mount_opt, RESERVATION);
632 ext2_msg(sb, KERN_INFO, "reservations ON");
633 break;
634 case Opt_noreservation:
635 clear_opt(sbi->s_mount_opt, RESERVATION);
636 ext2_msg(sb, KERN_INFO, "reservations OFF");
637 break;
638 case Opt_ignore:
639 break;
640 default:
641 return 0;
642 }
643 }
644 return 1;
645 }
646
647 static int ext2_setup_super (struct super_block * sb,
648 struct ext2_super_block * es,
649 int read_only)
650 {
651 int res = 0;
652 struct ext2_sb_info *sbi = EXT2_SB(sb);
653
654 if (le32_to_cpu(es->s_rev_level) > EXT2_MAX_SUPP_REV) {
655 ext2_msg(sb, KERN_ERR,
656 "error: revision level too high, "
657 "forcing read-only mode");
658 res = MS_RDONLY;
659 }
660 if (read_only)
661 return res;
662 if (!(sbi->s_mount_state & EXT2_VALID_FS))
663 ext2_msg(sb, KERN_WARNING,
664 "warning: mounting unchecked fs, "
665 "running e2fsck is recommended");
666 else if ((sbi->s_mount_state & EXT2_ERROR_FS))
667 ext2_msg(sb, KERN_WARNING,
668 "warning: mounting fs with errors, "
669 "running e2fsck is recommended");
670 else if ((__s16) le16_to_cpu(es->s_max_mnt_count) >= 0 &&
671 le16_to_cpu(es->s_mnt_count) >=
672 (unsigned short) (__s16) le16_to_cpu(es->s_max_mnt_count))
673 ext2_msg(sb, KERN_WARNING,
674 "warning: maximal mount count reached, "
675 "running e2fsck is recommended");
676 else if (le32_to_cpu(es->s_checkinterval) &&
677 (le32_to_cpu(es->s_lastcheck) +
678 le32_to_cpu(es->s_checkinterval) <= get_seconds()))
679 ext2_msg(sb, KERN_WARNING,
680 "warning: checktime reached, "
681 "running e2fsck is recommended");
682 if (!le16_to_cpu(es->s_max_mnt_count))
683 es->s_max_mnt_count = cpu_to_le16(EXT2_DFL_MAX_MNT_COUNT);
684 le16_add_cpu(&es->s_mnt_count, 1);
685 if (test_opt (sb, DEBUG))
686 ext2_msg(sb, KERN_INFO, "%s, %s, bs=%lu, fs=%lu, gc=%lu, "
687 "bpg=%lu, ipg=%lu, mo=%04lx]",
688 EXT2FS_VERSION, EXT2FS_DATE, sb->s_blocksize,
689 sbi->s_frag_size,
690 sbi->s_groups_count,
691 EXT2_BLOCKS_PER_GROUP(sb),
692 EXT2_INODES_PER_GROUP(sb),
693 sbi->s_mount_opt);
694 return res;
695 }
696
697 static int ext2_check_descriptors(struct super_block *sb)
698 {
699 int i;
700 struct ext2_sb_info *sbi = EXT2_SB(sb);
701
702 ext2_debug ("Checking group descriptors");
703
704 for (i = 0; i < sbi->s_groups_count; i++) {
705 struct ext2_group_desc *gdp = ext2_get_group_desc(sb, i, NULL);
706 ext2_fsblk_t first_block = ext2_group_first_block_no(sb, i);
707 ext2_fsblk_t last_block;
708
709 if (i == sbi->s_groups_count - 1)
710 last_block = le32_to_cpu(sbi->s_es->s_blocks_count) - 1;
711 else
712 last_block = first_block +
713 (EXT2_BLOCKS_PER_GROUP(sb) - 1);
714
715 if (le32_to_cpu(gdp->bg_block_bitmap) < first_block ||
716 le32_to_cpu(gdp->bg_block_bitmap) > last_block)
717 {
718 ext2_error (sb, "ext2_check_descriptors",
719 "Block bitmap for group %d"
720 " not in group (block %lu)!",
721 i, (unsigned long) le32_to_cpu(gdp->bg_block_bitmap));
722 return 0;
723 }
724 if (le32_to_cpu(gdp->bg_inode_bitmap) < first_block ||
725 le32_to_cpu(gdp->bg_inode_bitmap) > last_block)
726 {
727 ext2_error (sb, "ext2_check_descriptors",
728 "Inode bitmap for group %d"
729 " not in group (block %lu)!",
730 i, (unsigned long) le32_to_cpu(gdp->bg_inode_bitmap));
731 return 0;
732 }
733 if (le32_to_cpu(gdp->bg_inode_table) < first_block ||
734 le32_to_cpu(gdp->bg_inode_table) + sbi->s_itb_per_group - 1 >
735 last_block)
736 {
737 ext2_error (sb, "ext2_check_descriptors",
738 "Inode table for group %d"
739 " not in group (block %lu)!",
740 i, (unsigned long) le32_to_cpu(gdp->bg_inode_table));
741 return 0;
742 }
743 }
744 return 1;
745 }
746
747 /*
748 * Maximal file size. There is a direct, and {,double-,triple-}indirect
749 * block limit, and also a limit of (2^32 - 1) 512-byte sectors in i_blocks.
750 * We need to be 1 filesystem block less than the 2^32 sector limit.
751 */
752 static loff_t ext2_max_size(int bits)
753 {
754 loff_t res = EXT2_NDIR_BLOCKS;
755 int meta_blocks;
756 loff_t upper_limit;
757
758 /* This is calculated to be the largest file size for a
759 * dense, file such that the total number of
760 * sectors in the file, including data and all indirect blocks,
761 * does not exceed 2^32 -1
762 * __u32 i_blocks representing the total number of
763 * 512 bytes blocks of the file
764 */
765 upper_limit = (1LL << 32) - 1;
766
767 /* total blocks in file system block size */
768 upper_limit >>= (bits - 9);
769
770
771 /* indirect blocks */
772 meta_blocks = 1;
773 /* double indirect blocks */
774 meta_blocks += 1 + (1LL << (bits-2));
775 /* tripple indirect blocks */
776 meta_blocks += 1 + (1LL << (bits-2)) + (1LL << (2*(bits-2)));
777
778 upper_limit -= meta_blocks;
779 upper_limit <<= bits;
780
781 res += 1LL << (bits-2);
782 res += 1LL << (2*(bits-2));
783 res += 1LL << (3*(bits-2));
784 res <<= bits;
785 if (res > upper_limit)
786 res = upper_limit;
787
788 if (res > MAX_LFS_FILESIZE)
789 res = MAX_LFS_FILESIZE;
790
791 return res;
792 }
793
794 static unsigned long descriptor_loc(struct super_block *sb,
795 unsigned long logic_sb_block,
796 int nr)
797 {
798 struct ext2_sb_info *sbi = EXT2_SB(sb);
799 unsigned long bg, first_meta_bg;
800 int has_super = 0;
801
802 first_meta_bg = le32_to_cpu(sbi->s_es->s_first_meta_bg);
803
804 if (!EXT2_HAS_INCOMPAT_FEATURE(sb, EXT2_FEATURE_INCOMPAT_META_BG) ||
805 nr < first_meta_bg)
806 return (logic_sb_block + nr + 1);
807 bg = sbi->s_desc_per_block * nr;
808 if (ext2_bg_has_super(sb, bg))
809 has_super = 1;
810
811 return ext2_group_first_block_no(sb, bg) + has_super;
812 }
813
814 static int ext2_fill_super(struct super_block *sb, void *data, int silent)
815 {
816 struct buffer_head * bh;
817 struct ext2_sb_info * sbi;
818 struct ext2_super_block * es;
819 struct inode *root;
820 unsigned long block;
821 unsigned long sb_block = get_sb_block(&data);
822 unsigned long logic_sb_block;
823 unsigned long offset = 0;
824 unsigned long def_mount_opts;
825 long ret = -EINVAL;
826 int blocksize = BLOCK_SIZE;
827 int db_count;
828 int i, j;
829 __le32 features;
830 int err;
831
832 err = -ENOMEM;
833 sbi = kzalloc(sizeof(*sbi), GFP_KERNEL);
834 if (!sbi)
835 goto failed;
836
837 sbi->s_blockgroup_lock =
838 kzalloc(sizeof(struct blockgroup_lock), GFP_KERNEL);
839 if (!sbi->s_blockgroup_lock) {
840 kfree(sbi);
841 goto failed;
842 }
843 sb->s_fs_info = sbi;
844 sbi->s_sb_block = sb_block;
845
846 spin_lock_init(&sbi->s_lock);
847
848 /*
849 * See what the current blocksize for the device is, and
850 * use that as the blocksize. Otherwise (or if the blocksize
851 * is smaller than the default) use the default.
852 * This is important for devices that have a hardware
853 * sectorsize that is larger than the default.
854 */
855 blocksize = sb_min_blocksize(sb, BLOCK_SIZE);
856 if (!blocksize) {
857 ext2_msg(sb, KERN_ERR, "error: unable to set blocksize");
858 goto failed_sbi;
859 }
860
861 /*
862 * If the superblock doesn't start on a hardware sector boundary,
863 * calculate the offset.
864 */
865 if (blocksize != BLOCK_SIZE) {
866 logic_sb_block = (sb_block*BLOCK_SIZE) / blocksize;
867 offset = (sb_block*BLOCK_SIZE) % blocksize;
868 } else {
869 logic_sb_block = sb_block;
870 }
871
872 if (!(bh = sb_bread(sb, logic_sb_block))) {
873 ext2_msg(sb, KERN_ERR, "error: unable to read superblock");
874 goto failed_sbi;
875 }
876 /*
877 * Note: s_es must be initialized as soon as possible because
878 * some ext2 macro-instructions depend on its value
879 */
880 es = (struct ext2_super_block *) (((char *)bh->b_data) + offset);
881 sbi->s_es = es;
882 sb->s_magic = le16_to_cpu(es->s_magic);
883
884 if (sb->s_magic != EXT2_SUPER_MAGIC)
885 goto cantfind_ext2;
886
887 /* Set defaults before we parse the mount options */
888 def_mount_opts = le32_to_cpu(es->s_default_mount_opts);
889 if (def_mount_opts & EXT2_DEFM_DEBUG)
890 set_opt(sbi->s_mount_opt, DEBUG);
891 if (def_mount_opts & EXT2_DEFM_BSDGROUPS)
892 set_opt(sbi->s_mount_opt, GRPID);
893 if (def_mount_opts & EXT2_DEFM_UID16)
894 set_opt(sbi->s_mount_opt, NO_UID32);
895 #ifdef CONFIG_EXT2_FS_XATTR
896 if (def_mount_opts & EXT2_DEFM_XATTR_USER)
897 set_opt(sbi->s_mount_opt, XATTR_USER);
898 #endif
899 #ifdef CONFIG_EXT2_FS_POSIX_ACL
900 if (def_mount_opts & EXT2_DEFM_ACL)
901 set_opt(sbi->s_mount_opt, POSIX_ACL);
902 #endif
903
904 if (le16_to_cpu(sbi->s_es->s_errors) == EXT2_ERRORS_PANIC)
905 set_opt(sbi->s_mount_opt, ERRORS_PANIC);
906 else if (le16_to_cpu(sbi->s_es->s_errors) == EXT2_ERRORS_CONTINUE)
907 set_opt(sbi->s_mount_opt, ERRORS_CONT);
908 else
909 set_opt(sbi->s_mount_opt, ERRORS_RO);
910
911 sbi->s_resuid = make_kuid(&init_user_ns, le16_to_cpu(es->s_def_resuid));
912 sbi->s_resgid = make_kgid(&init_user_ns, le16_to_cpu(es->s_def_resgid));
913
914 set_opt(sbi->s_mount_opt, RESERVATION);
915
916 if (!parse_options((char *) data, sb))
917 goto failed_mount;
918
919 sb->s_flags = (sb->s_flags & ~MS_POSIXACL) |
920 ((EXT2_SB(sb)->s_mount_opt & EXT2_MOUNT_POSIX_ACL) ?
921 MS_POSIXACL : 0);
922 sb->s_iflags |= SB_I_CGROUPWB;
923
924 if (le32_to_cpu(es->s_rev_level) == EXT2_GOOD_OLD_REV &&
925 (EXT2_HAS_COMPAT_FEATURE(sb, ~0U) ||
926 EXT2_HAS_RO_COMPAT_FEATURE(sb, ~0U) ||
927 EXT2_HAS_INCOMPAT_FEATURE(sb, ~0U)))
928 ext2_msg(sb, KERN_WARNING,
929 "warning: feature flags set on rev 0 fs, "
930 "running e2fsck is recommended");
931 /*
932 * Check feature flags regardless of the revision level, since we
933 * previously didn't change the revision level when setting the flags,
934 * so there is a chance incompat flags are set on a rev 0 filesystem.
935 */
936 features = EXT2_HAS_INCOMPAT_FEATURE(sb, ~EXT2_FEATURE_INCOMPAT_SUPP);
937 if (features) {
938 ext2_msg(sb, KERN_ERR, "error: couldn't mount because of "
939 "unsupported optional features (%x)",
940 le32_to_cpu(features));
941 goto failed_mount;
942 }
943 if (!(sb->s_flags & MS_RDONLY) &&
944 (features = EXT2_HAS_RO_COMPAT_FEATURE(sb, ~EXT2_FEATURE_RO_COMPAT_SUPP))){
945 ext2_msg(sb, KERN_ERR, "error: couldn't mount RDWR because of "
946 "unsupported optional features (%x)",
947 le32_to_cpu(features));
948 goto failed_mount;
949 }
950
951 blocksize = BLOCK_SIZE << le32_to_cpu(sbi->s_es->s_log_block_size);
952
953 if (sbi->s_mount_opt & EXT2_MOUNT_DAX) {
954 err = bdev_dax_supported(sb, blocksize);
955 if (err)
956 goto failed_mount;
957 }
958
959 /* If the blocksize doesn't match, re-read the thing.. */
960 if (sb->s_blocksize != blocksize) {
961 brelse(bh);
962
963 if (!sb_set_blocksize(sb, blocksize)) {
964 ext2_msg(sb, KERN_ERR,
965 "error: bad blocksize %d", blocksize);
966 goto failed_sbi;
967 }
968
969 logic_sb_block = (sb_block*BLOCK_SIZE) / blocksize;
970 offset = (sb_block*BLOCK_SIZE) % blocksize;
971 bh = sb_bread(sb, logic_sb_block);
972 if(!bh) {
973 ext2_msg(sb, KERN_ERR, "error: couldn't read"
974 "superblock on 2nd try");
975 goto failed_sbi;
976 }
977 es = (struct ext2_super_block *) (((char *)bh->b_data) + offset);
978 sbi->s_es = es;
979 if (es->s_magic != cpu_to_le16(EXT2_SUPER_MAGIC)) {
980 ext2_msg(sb, KERN_ERR, "error: magic mismatch");
981 goto failed_mount;
982 }
983 }
984
985 sb->s_maxbytes = ext2_max_size(sb->s_blocksize_bits);
986 sb->s_max_links = EXT2_LINK_MAX;
987
988 if (le32_to_cpu(es->s_rev_level) == EXT2_GOOD_OLD_REV) {
989 sbi->s_inode_size = EXT2_GOOD_OLD_INODE_SIZE;
990 sbi->s_first_ino = EXT2_GOOD_OLD_FIRST_INO;
991 } else {
992 sbi->s_inode_size = le16_to_cpu(es->s_inode_size);
993 sbi->s_first_ino = le32_to_cpu(es->s_first_ino);
994 if ((sbi->s_inode_size < EXT2_GOOD_OLD_INODE_SIZE) ||
995 !is_power_of_2(sbi->s_inode_size) ||
996 (sbi->s_inode_size > blocksize)) {
997 ext2_msg(sb, KERN_ERR,
998 "error: unsupported inode size: %d",
999 sbi->s_inode_size);
1000 goto failed_mount;
1001 }
1002 }
1003
1004 sbi->s_frag_size = EXT2_MIN_FRAG_SIZE <<
1005 le32_to_cpu(es->s_log_frag_size);
1006 if (sbi->s_frag_size == 0)
1007 goto cantfind_ext2;
1008 sbi->s_frags_per_block = sb->s_blocksize / sbi->s_frag_size;
1009
1010 sbi->s_blocks_per_group = le32_to_cpu(es->s_blocks_per_group);
1011 sbi->s_frags_per_group = le32_to_cpu(es->s_frags_per_group);
1012 sbi->s_inodes_per_group = le32_to_cpu(es->s_inodes_per_group);
1013
1014 if (EXT2_INODE_SIZE(sb) == 0)
1015 goto cantfind_ext2;
1016 sbi->s_inodes_per_block = sb->s_blocksize / EXT2_INODE_SIZE(sb);
1017 if (sbi->s_inodes_per_block == 0 || sbi->s_inodes_per_group == 0)
1018 goto cantfind_ext2;
1019 sbi->s_itb_per_group = sbi->s_inodes_per_group /
1020 sbi->s_inodes_per_block;
1021 sbi->s_desc_per_block = sb->s_blocksize /
1022 sizeof (struct ext2_group_desc);
1023 sbi->s_sbh = bh;
1024 sbi->s_mount_state = le16_to_cpu(es->s_state);
1025 sbi->s_addr_per_block_bits =
1026 ilog2 (EXT2_ADDR_PER_BLOCK(sb));
1027 sbi->s_desc_per_block_bits =
1028 ilog2 (EXT2_DESC_PER_BLOCK(sb));
1029
1030 if (sb->s_magic != EXT2_SUPER_MAGIC)
1031 goto cantfind_ext2;
1032
1033 if (sb->s_blocksize != bh->b_size) {
1034 if (!silent)
1035 ext2_msg(sb, KERN_ERR, "error: unsupported blocksize");
1036 goto failed_mount;
1037 }
1038
1039 if (sb->s_blocksize != sbi->s_frag_size) {
1040 ext2_msg(sb, KERN_ERR,
1041 "error: fragsize %lu != blocksize %lu"
1042 "(not supported yet)",
1043 sbi->s_frag_size, sb->s_blocksize);
1044 goto failed_mount;
1045 }
1046
1047 if (sbi->s_blocks_per_group > sb->s_blocksize * 8) {
1048 ext2_msg(sb, KERN_ERR,
1049 "error: #blocks per group too big: %lu",
1050 sbi->s_blocks_per_group);
1051 goto failed_mount;
1052 }
1053 if (sbi->s_frags_per_group > sb->s_blocksize * 8) {
1054 ext2_msg(sb, KERN_ERR,
1055 "error: #fragments per group too big: %lu",
1056 sbi->s_frags_per_group);
1057 goto failed_mount;
1058 }
1059 if (sbi->s_inodes_per_group > sb->s_blocksize * 8) {
1060 ext2_msg(sb, KERN_ERR,
1061 "error: #inodes per group too big: %lu",
1062 sbi->s_inodes_per_group);
1063 goto failed_mount;
1064 }
1065
1066 if (EXT2_BLOCKS_PER_GROUP(sb) == 0)
1067 goto cantfind_ext2;
1068 sbi->s_groups_count = ((le32_to_cpu(es->s_blocks_count) -
1069 le32_to_cpu(es->s_first_data_block) - 1)
1070 / EXT2_BLOCKS_PER_GROUP(sb)) + 1;
1071 db_count = (sbi->s_groups_count + EXT2_DESC_PER_BLOCK(sb) - 1) /
1072 EXT2_DESC_PER_BLOCK(sb);
1073 sbi->s_group_desc = kmalloc (db_count * sizeof (struct buffer_head *), GFP_KERNEL);
1074 if (sbi->s_group_desc == NULL) {
1075 ext2_msg(sb, KERN_ERR, "error: not enough memory");
1076 goto failed_mount;
1077 }
1078 bgl_lock_init(sbi->s_blockgroup_lock);
1079 sbi->s_debts = kcalloc(sbi->s_groups_count, sizeof(*sbi->s_debts), GFP_KERNEL);
1080 if (!sbi->s_debts) {
1081 ext2_msg(sb, KERN_ERR, "error: not enough memory");
1082 goto failed_mount_group_desc;
1083 }
1084 for (i = 0; i < db_count; i++) {
1085 block = descriptor_loc(sb, logic_sb_block, i);
1086 sbi->s_group_desc[i] = sb_bread(sb, block);
1087 if (!sbi->s_group_desc[i]) {
1088 for (j = 0; j < i; j++)
1089 brelse (sbi->s_group_desc[j]);
1090 ext2_msg(sb, KERN_ERR,
1091 "error: unable to read group descriptors");
1092 goto failed_mount_group_desc;
1093 }
1094 }
1095 if (!ext2_check_descriptors (sb)) {
1096 ext2_msg(sb, KERN_ERR, "group descriptors corrupted");
1097 goto failed_mount2;
1098 }
1099 sbi->s_gdb_count = db_count;
1100 get_random_bytes(&sbi->s_next_generation, sizeof(u32));
1101 spin_lock_init(&sbi->s_next_gen_lock);
1102
1103 /* per filesystem reservation list head & lock */
1104 spin_lock_init(&sbi->s_rsv_window_lock);
1105 sbi->s_rsv_window_root = RB_ROOT;
1106 /*
1107 * Add a single, static dummy reservation to the start of the
1108 * reservation window list --- it gives us a placeholder for
1109 * append-at-start-of-list which makes the allocation logic
1110 * _much_ simpler.
1111 */
1112 sbi->s_rsv_window_head.rsv_start = EXT2_RESERVE_WINDOW_NOT_ALLOCATED;
1113 sbi->s_rsv_window_head.rsv_end = EXT2_RESERVE_WINDOW_NOT_ALLOCATED;
1114 sbi->s_rsv_window_head.rsv_alloc_hit = 0;
1115 sbi->s_rsv_window_head.rsv_goal_size = 0;
1116 ext2_rsv_window_add(sb, &sbi->s_rsv_window_head);
1117
1118 err = percpu_counter_init(&sbi->s_freeblocks_counter,
1119 ext2_count_free_blocks(sb), GFP_KERNEL);
1120 if (!err) {
1121 err = percpu_counter_init(&sbi->s_freeinodes_counter,
1122 ext2_count_free_inodes(sb), GFP_KERNEL);
1123 }
1124 if (!err) {
1125 err = percpu_counter_init(&sbi->s_dirs_counter,
1126 ext2_count_dirs(sb), GFP_KERNEL);
1127 }
1128 if (err) {
1129 ext2_msg(sb, KERN_ERR, "error: insufficient memory");
1130 goto failed_mount3;
1131 }
1132
1133 #ifdef CONFIG_EXT2_FS_XATTR
1134 sbi->s_ea_block_cache = ext2_xattr_create_cache();
1135 if (!sbi->s_ea_block_cache) {
1136 ext2_msg(sb, KERN_ERR, "Failed to create ea_block_cache");
1137 goto failed_mount3;
1138 }
1139 #endif
1140 /*
1141 * set up enough so that it can read an inode
1142 */
1143 sb->s_op = &ext2_sops;
1144 sb->s_export_op = &ext2_export_ops;
1145 sb->s_xattr = ext2_xattr_handlers;
1146
1147 #ifdef CONFIG_QUOTA
1148 sb->dq_op = &dquot_operations;
1149 sb->s_qcop = &ext2_quotactl_ops;
1150 sb->s_quota_types = QTYPE_MASK_USR | QTYPE_MASK_GRP;
1151 #endif
1152
1153 root = ext2_iget(sb, EXT2_ROOT_INO);
1154 if (IS_ERR(root)) {
1155 ret = PTR_ERR(root);
1156 goto failed_mount3;
1157 }
1158 if (!S_ISDIR(root->i_mode) || !root->i_blocks || !root->i_size) {
1159 iput(root);
1160 ext2_msg(sb, KERN_ERR, "error: corrupt root inode, run e2fsck");
1161 goto failed_mount3;
1162 }
1163
1164 sb->s_root = d_make_root(root);
1165 if (!sb->s_root) {
1166 ext2_msg(sb, KERN_ERR, "error: get root inode failed");
1167 ret = -ENOMEM;
1168 goto failed_mount3;
1169 }
1170 if (EXT2_HAS_COMPAT_FEATURE(sb, EXT3_FEATURE_COMPAT_HAS_JOURNAL))
1171 ext2_msg(sb, KERN_WARNING,
1172 "warning: mounting ext3 filesystem as ext2");
1173 if (ext2_setup_super (sb, es, sb->s_flags & MS_RDONLY))
1174 sb->s_flags |= MS_RDONLY;
1175 ext2_write_super(sb);
1176 return 0;
1177
1178 cantfind_ext2:
1179 if (!silent)
1180 ext2_msg(sb, KERN_ERR,
1181 "error: can't find an ext2 filesystem on dev %s.",
1182 sb->s_id);
1183 goto failed_mount;
1184 failed_mount3:
1185 if (sbi->s_ea_block_cache)
1186 ext2_xattr_destroy_cache(sbi->s_ea_block_cache);
1187 percpu_counter_destroy(&sbi->s_freeblocks_counter);
1188 percpu_counter_destroy(&sbi->s_freeinodes_counter);
1189 percpu_counter_destroy(&sbi->s_dirs_counter);
1190 failed_mount2:
1191 for (i = 0; i < db_count; i++)
1192 brelse(sbi->s_group_desc[i]);
1193 failed_mount_group_desc:
1194 kfree(sbi->s_group_desc);
1195 kfree(sbi->s_debts);
1196 failed_mount:
1197 brelse(bh);
1198 failed_sbi:
1199 sb->s_fs_info = NULL;
1200 kfree(sbi->s_blockgroup_lock);
1201 kfree(sbi);
1202 failed:
1203 return ret;
1204 }
1205
1206 static void ext2_clear_super_error(struct super_block *sb)
1207 {
1208 struct buffer_head *sbh = EXT2_SB(sb)->s_sbh;
1209
1210 if (buffer_write_io_error(sbh)) {
1211 /*
1212 * Oh, dear. A previous attempt to write the
1213 * superblock failed. This could happen because the
1214 * USB device was yanked out. Or it could happen to
1215 * be a transient write error and maybe the block will
1216 * be remapped. Nothing we can do but to retry the
1217 * write and hope for the best.
1218 */
1219 ext2_msg(sb, KERN_ERR,
1220 "previous I/O error to superblock detected\n");
1221 clear_buffer_write_io_error(sbh);
1222 set_buffer_uptodate(sbh);
1223 }
1224 }
1225
1226 void ext2_sync_super(struct super_block *sb, struct ext2_super_block *es,
1227 int wait)
1228 {
1229 ext2_clear_super_error(sb);
1230 spin_lock(&EXT2_SB(sb)->s_lock);
1231 es->s_free_blocks_count = cpu_to_le32(ext2_count_free_blocks(sb));
1232 es->s_free_inodes_count = cpu_to_le32(ext2_count_free_inodes(sb));
1233 es->s_wtime = cpu_to_le32(get_seconds());
1234 /* unlock before we do IO */
1235 spin_unlock(&EXT2_SB(sb)->s_lock);
1236 mark_buffer_dirty(EXT2_SB(sb)->s_sbh);
1237 if (wait)
1238 sync_dirty_buffer(EXT2_SB(sb)->s_sbh);
1239 }
1240
1241 /*
1242 * In the second extended file system, it is not necessary to
1243 * write the super block since we use a mapping of the
1244 * disk super block in a buffer.
1245 *
1246 * However, this function is still used to set the fs valid
1247 * flags to 0. We need to set this flag to 0 since the fs
1248 * may have been checked while mounted and e2fsck may have
1249 * set s_state to EXT2_VALID_FS after some corrections.
1250 */
1251 static int ext2_sync_fs(struct super_block *sb, int wait)
1252 {
1253 struct ext2_sb_info *sbi = EXT2_SB(sb);
1254 struct ext2_super_block *es = EXT2_SB(sb)->s_es;
1255
1256 /*
1257 * Write quota structures to quota file, sync_blockdev() will write
1258 * them to disk later
1259 */
1260 dquot_writeback_dquots(sb, -1);
1261
1262 spin_lock(&sbi->s_lock);
1263 if (es->s_state & cpu_to_le16(EXT2_VALID_FS)) {
1264 ext2_debug("setting valid to 0\n");
1265 es->s_state &= cpu_to_le16(~EXT2_VALID_FS);
1266 }
1267 spin_unlock(&sbi->s_lock);
1268 ext2_sync_super(sb, es, wait);
1269 return 0;
1270 }
1271
1272 static int ext2_freeze(struct super_block *sb)
1273 {
1274 struct ext2_sb_info *sbi = EXT2_SB(sb);
1275
1276 /*
1277 * Open but unlinked files present? Keep EXT2_VALID_FS flag cleared
1278 * because we have unattached inodes and thus filesystem is not fully
1279 * consistent.
1280 */
1281 if (atomic_long_read(&sb->s_remove_count)) {
1282 ext2_sync_fs(sb, 1);
1283 return 0;
1284 }
1285 /* Set EXT2_FS_VALID flag */
1286 spin_lock(&sbi->s_lock);
1287 sbi->s_es->s_state = cpu_to_le16(sbi->s_mount_state);
1288 spin_unlock(&sbi->s_lock);
1289 ext2_sync_super(sb, sbi->s_es, 1);
1290
1291 return 0;
1292 }
1293
/*
 * ext2_unfreeze - undo ext2_freeze()
 * @sb: superblock being thawed
 *
 * Rewriting the superblock is all that is needed; doing so clears the
 * EXT2_VALID_FS flag again.  Always returns 0.
 */
static int ext2_unfreeze(struct super_block *sb)
{
	ext2_write_super(sb);
	return 0;
}
1301
1302 static void ext2_write_super(struct super_block *sb)
1303 {
1304 if (!(sb->s_flags & MS_RDONLY))
1305 ext2_sync_fs(sb, 1);
1306 }
1307
1308 static int ext2_remount (struct super_block * sb, int * flags, char * data)
1309 {
1310 struct ext2_sb_info * sbi = EXT2_SB(sb);
1311 struct ext2_super_block * es;
1312 struct ext2_mount_options old_opts;
1313 unsigned long old_sb_flags;
1314 int err;
1315
1316 sync_filesystem(sb);
1317 spin_lock(&sbi->s_lock);
1318
1319 /* Store the old options */
1320 old_sb_flags = sb->s_flags;
1321 old_opts.s_mount_opt = sbi->s_mount_opt;
1322 old_opts.s_resuid = sbi->s_resuid;
1323 old_opts.s_resgid = sbi->s_resgid;
1324
1325 /*
1326 * Allow the "check" option to be passed as a remount option.
1327 */
1328 if (!parse_options(data, sb)) {
1329 err = -EINVAL;
1330 goto restore_opts;
1331 }
1332
1333 sb->s_flags = (sb->s_flags & ~MS_POSIXACL) |
1334 ((sbi->s_mount_opt & EXT2_MOUNT_POSIX_ACL) ? MS_POSIXACL : 0);
1335
1336 es = sbi->s_es;
1337 if ((sbi->s_mount_opt ^ old_opts.s_mount_opt) & EXT2_MOUNT_DAX) {
1338 ext2_msg(sb, KERN_WARNING, "warning: refusing change of "
1339 "dax flag with busy inodes while remounting");
1340 sbi->s_mount_opt ^= EXT2_MOUNT_DAX;
1341 }
1342 if ((*flags & MS_RDONLY) == (sb->s_flags & MS_RDONLY)) {
1343 spin_unlock(&sbi->s_lock);
1344 return 0;
1345 }
1346 if (*flags & MS_RDONLY) {
1347 if (le16_to_cpu(es->s_state) & EXT2_VALID_FS ||
1348 !(sbi->s_mount_state & EXT2_VALID_FS)) {
1349 spin_unlock(&sbi->s_lock);
1350 return 0;
1351 }
1352
1353 /*
1354 * OK, we are remounting a valid rw partition rdonly, so set
1355 * the rdonly flag and then mark the partition as valid again.
1356 */
1357 es->s_state = cpu_to_le16(sbi->s_mount_state);
1358 es->s_mtime = cpu_to_le32(get_seconds());
1359 spin_unlock(&sbi->s_lock);
1360
1361 err = dquot_suspend(sb, -1);
1362 if (err < 0) {
1363 spin_lock(&sbi->s_lock);
1364 goto restore_opts;
1365 }
1366
1367 ext2_sync_super(sb, es, 1);
1368 } else {
1369 __le32 ret = EXT2_HAS_RO_COMPAT_FEATURE(sb,
1370 ~EXT2_FEATURE_RO_COMPAT_SUPP);
1371 if (ret) {
1372 ext2_msg(sb, KERN_WARNING,
1373 "warning: couldn't remount RDWR because of "
1374 "unsupported optional features (%x).",
1375 le32_to_cpu(ret));
1376 err = -EROFS;
1377 goto restore_opts;
1378 }
1379 /*
1380 * Mounting a RDONLY partition read-write, so reread and
1381 * store the current valid flag. (It may have been changed
1382 * by e2fsck since we originally mounted the partition.)
1383 */
1384 sbi->s_mount_state = le16_to_cpu(es->s_state);
1385 if (!ext2_setup_super (sb, es, 0))
1386 sb->s_flags &= ~MS_RDONLY;
1387 spin_unlock(&sbi->s_lock);
1388
1389 ext2_write_super(sb);
1390
1391 dquot_resume(sb, -1);
1392 }
1393
1394 return 0;
1395 restore_opts:
1396 sbi->s_mount_opt = old_opts.s_mount_opt;
1397 sbi->s_resuid = old_opts.s_resuid;
1398 sbi->s_resgid = old_opts.s_resgid;
1399 sb->s_flags = old_sb_flags;
1400 spin_unlock(&sbi->s_lock);
1401 return err;
1402 }
1403
1404 static int ext2_statfs (struct dentry * dentry, struct kstatfs * buf)
1405 {
1406 struct super_block *sb = dentry->d_sb;
1407 struct ext2_sb_info *sbi = EXT2_SB(sb);
1408 struct ext2_super_block *es = sbi->s_es;
1409 u64 fsid;
1410
1411 spin_lock(&sbi->s_lock);
1412
1413 if (test_opt (sb, MINIX_DF))
1414 sbi->s_overhead_last = 0;
1415 else if (sbi->s_blocks_last != le32_to_cpu(es->s_blocks_count)) {
1416 unsigned long i, overhead = 0;
1417 smp_rmb();
1418
1419 /*
1420 * Compute the overhead (FS structures). This is constant
1421 * for a given filesystem unless the number of block groups
1422 * changes so we cache the previous value until it does.
1423 */
1424
1425 /*
1426 * All of the blocks before first_data_block are
1427 * overhead
1428 */
1429 overhead = le32_to_cpu(es->s_first_data_block);
1430
1431 /*
1432 * Add the overhead attributed to the superblock and
1433 * block group descriptors. If the sparse superblocks
1434 * feature is turned on, then not all groups have this.
1435 */
1436 for (i = 0; i < sbi->s_groups_count; i++)
1437 overhead += ext2_bg_has_super(sb, i) +
1438 ext2_bg_num_gdb(sb, i);
1439
1440 /*
1441 * Every block group has an inode bitmap, a block
1442 * bitmap, and an inode table.
1443 */
1444 overhead += (sbi->s_groups_count *
1445 (2 + sbi->s_itb_per_group));
1446 sbi->s_overhead_last = overhead;
1447 smp_wmb();
1448 sbi->s_blocks_last = le32_to_cpu(es->s_blocks_count);
1449 }
1450
1451 buf->f_type = EXT2_SUPER_MAGIC;
1452 buf->f_bsize = sb->s_blocksize;
1453 buf->f_blocks = le32_to_cpu(es->s_blocks_count) - sbi->s_overhead_last;
1454 buf->f_bfree = ext2_count_free_blocks(sb);
1455 es->s_free_blocks_count = cpu_to_le32(buf->f_bfree);
1456 buf->f_bavail = buf->f_bfree - le32_to_cpu(es->s_r_blocks_count);
1457 if (buf->f_bfree < le32_to_cpu(es->s_r_blocks_count))
1458 buf->f_bavail = 0;
1459 buf->f_files = le32_to_cpu(es->s_inodes_count);
1460 buf->f_ffree = ext2_count_free_inodes(sb);
1461 es->s_free_inodes_count = cpu_to_le32(buf->f_ffree);
1462 buf->f_namelen = EXT2_NAME_LEN;
1463 fsid = le64_to_cpup((void *)es->s_uuid) ^
1464 le64_to_cpup((void *)es->s_uuid + sizeof(u64));
1465 buf->f_fsid.val[0] = fsid & 0xFFFFFFFFUL;
1466 buf->f_fsid.val[1] = (fsid >> 32) & 0xFFFFFFFFUL;
1467 spin_unlock(&sbi->s_lock);
1468 return 0;
1469 }
1470
1471 static struct dentry *ext2_mount(struct file_system_type *fs_type,
1472 int flags, const char *dev_name, void *data)
1473 {
1474 return mount_bdev(fs_type, flags, dev_name, data, ext2_fill_super);
1475 }
1476
1477 #ifdef CONFIG_QUOTA
1478
1479 /* Read data from quotafile - avoid pagecache and such because we cannot afford
1480 * acquiring the locks... As quota files are never truncated and quota code
1481 * itself serializes the operations (and no one else should touch the files)
1482 * we don't have to be afraid of races */
1483 static ssize_t ext2_quota_read(struct super_block *sb, int type, char *data,
1484 size_t len, loff_t off)
1485 {
1486 struct inode *inode = sb_dqopt(sb)->files[type];
1487 sector_t blk = off >> EXT2_BLOCK_SIZE_BITS(sb);
1488 int err = 0;
1489 int offset = off & (sb->s_blocksize - 1);
1490 int tocopy;
1491 size_t toread;
1492 struct buffer_head tmp_bh;
1493 struct buffer_head *bh;
1494 loff_t i_size = i_size_read(inode);
1495
1496 if (off > i_size)
1497 return 0;
1498 if (off+len > i_size)
1499 len = i_size-off;
1500 toread = len;
1501 while (toread > 0) {
1502 tocopy = sb->s_blocksize - offset < toread ?
1503 sb->s_blocksize - offset : toread;
1504
1505 tmp_bh.b_state = 0;
1506 tmp_bh.b_size = sb->s_blocksize;
1507 err = ext2_get_block(inode, blk, &tmp_bh, 0);
1508 if (err < 0)
1509 return err;
1510 if (!buffer_mapped(&tmp_bh)) /* A hole? */
1511 memset(data, 0, tocopy);
1512 else {
1513 bh = sb_bread(sb, tmp_bh.b_blocknr);
1514 if (!bh)
1515 return -EIO;
1516 memcpy(data, bh->b_data+offset, tocopy);
1517 brelse(bh);
1518 }
1519 offset = 0;
1520 toread -= tocopy;
1521 data += tocopy;
1522 blk++;
1523 }
1524 return len;
1525 }
1526
1527 /* Write to quotafile */
1528 static ssize_t ext2_quota_write(struct super_block *sb, int type,
1529 const char *data, size_t len, loff_t off)
1530 {
1531 struct inode *inode = sb_dqopt(sb)->files[type];
1532 sector_t blk = off >> EXT2_BLOCK_SIZE_BITS(sb);
1533 int err = 0;
1534 int offset = off & (sb->s_blocksize - 1);
1535 int tocopy;
1536 size_t towrite = len;
1537 struct buffer_head tmp_bh;
1538 struct buffer_head *bh;
1539
1540 while (towrite > 0) {
1541 tocopy = sb->s_blocksize - offset < towrite ?
1542 sb->s_blocksize - offset : towrite;
1543
1544 tmp_bh.b_state = 0;
1545 tmp_bh.b_size = sb->s_blocksize;
1546 err = ext2_get_block(inode, blk, &tmp_bh, 1);
1547 if (err < 0)
1548 goto out;
1549 if (offset || tocopy != EXT2_BLOCK_SIZE(sb))
1550 bh = sb_bread(sb, tmp_bh.b_blocknr);
1551 else
1552 bh = sb_getblk(sb, tmp_bh.b_blocknr);
1553 if (unlikely(!bh)) {
1554 err = -EIO;
1555 goto out;
1556 }
1557 lock_buffer(bh);
1558 memcpy(bh->b_data+offset, data, tocopy);
1559 flush_dcache_page(bh->b_page);
1560 set_buffer_uptodate(bh);
1561 mark_buffer_dirty(bh);
1562 unlock_buffer(bh);
1563 brelse(bh);
1564 offset = 0;
1565 towrite -= tocopy;
1566 data += tocopy;
1567 blk++;
1568 }
1569 out:
1570 if (len == towrite)
1571 return err;
1572 if (inode->i_size < off+len-towrite)
1573 i_size_write(inode, off+len-towrite);
1574 inode->i_version++;
1575 inode->i_mtime = inode->i_ctime = current_time(inode);
1576 mark_inode_dirty(inode);
1577 return len - towrite;
1578 }
1579
1580 static int ext2_quota_on(struct super_block *sb, int type, int format_id,
1581 const struct path *path)
1582 {
1583 int err;
1584 struct inode *inode;
1585
1586 err = dquot_quota_on(sb, type, format_id, path);
1587 if (err)
1588 return err;
1589
1590 inode = d_inode(path->dentry);
1591 inode_lock(inode);
1592 EXT2_I(inode)->i_flags |= EXT2_NOATIME_FL | EXT2_IMMUTABLE_FL;
1593 inode_set_flags(inode, S_NOATIME | S_IMMUTABLE,
1594 S_NOATIME | S_IMMUTABLE);
1595 inode_unlock(inode);
1596 mark_inode_dirty(inode);
1597
1598 return 0;
1599 }
1600
1601 static int ext2_quota_off(struct super_block *sb, int type)
1602 {
1603 struct inode *inode = sb_dqopt(sb)->files[type];
1604 int err;
1605
1606 if (!inode || !igrab(inode))
1607 goto out;
1608
1609 err = dquot_quota_off(sb, type);
1610 if (err)
1611 goto out_put;
1612
1613 inode_lock(inode);
1614 EXT2_I(inode)->i_flags &= ~(EXT2_NOATIME_FL | EXT2_IMMUTABLE_FL);
1615 inode_set_flags(inode, 0, S_NOATIME | S_IMMUTABLE);
1616 inode_unlock(inode);
1617 mark_inode_dirty(inode);
1618 out_put:
1619 iput(inode);
1620 return err;
1621 out:
1622 return dquot_quota_off(sb, type);
1623 }
1624
1625 #endif
1626
1627 static struct file_system_type ext2_fs_type = {
1628 .owner = THIS_MODULE,
1629 .name = "ext2",
1630 .mount = ext2_mount,
1631 .kill_sb = kill_block_super,
1632 .fs_flags = FS_REQUIRES_DEV,
1633 };
1634 MODULE_ALIAS_FS("ext2");
1635
1636 static int __init init_ext2_fs(void)
1637 {
1638 int err;
1639
1640 err = init_inodecache();
1641 if (err)
1642 return err;
1643 err = register_filesystem(&ext2_fs_type);
1644 if (err)
1645 goto out;
1646 return 0;
1647 out:
1648 destroy_inodecache();
1649 return err;
1650 }
1651
1652 static void __exit exit_ext2_fs(void)
1653 {
1654 unregister_filesystem(&ext2_fs_type);
1655 destroy_inodecache();
1656 }
1657
1658 MODULE_AUTHOR("Remy Card and others");
1659 MODULE_DESCRIPTION("Second Extended Filesystem");
1660 MODULE_LICENSE("GPL");
1661 module_init(init_ext2_fs)
1662 module_exit(exit_ext2_fs)