Imported Upstream version 0.6.5.3

[mirror_zfs-debian.git] / module / zfs / zpl_super.c
diff --git a/module/zfs/zpl_super.c b/module/zfs/zpl_super.c

index eee4a50e03a569932e22c270e7c492e4d8ec158a..bcdbbd69e2808e56d8b6588f9ed77aab19b5b745 100644 (file)
--- a/module/zfs/zpl_super.c
+++ b/module/zfs/zpl_super.c
@@ -44,7 +44,7 @@ zpl_inode_alloc(struct super_block *sb)
  static void
  zpl_inode_destroy(struct inode *ip)
  {
-        ASSERT(atomic_read(&ip->i_count) == 0);
+       ASSERT(atomic_read(&ip->i_count) == 0);
         zfs_inode_destroy(ip);
  }
  
@@ -57,13 +57,21 @@ zpl_inode_destroy(struct inode *ip)
  static void
  zpl_dirty_inode(struct inode *ip, int flags)
  {
+       fstrans_cookie_t cookie;
+
+       cookie = spl_fstrans_mark();
         zfs_dirty_inode(ip, flags);
+       spl_fstrans_unmark(cookie);
  }
  #else
  static void
  zpl_dirty_inode(struct inode *ip)
  {
+       fstrans_cookie_t cookie;
+
+       cookie = spl_fstrans_mark();
         zfs_dirty_inode(ip, 0);
+       spl_fstrans_unmark(cookie);
  }
  #endif /* HAVE_DIRTY_INODE_WITH_FLAGS */
  
@@ -98,17 +106,31 @@ zpl_dirty_inode(struct inode *ip)
  static void
  zpl_evict_inode(struct inode *ip)
  {
+       fstrans_cookie_t cookie;
+
+       cookie = spl_fstrans_mark();
         truncate_setsize(ip, 0);
         clear_inode(ip);
         zfs_inactive(ip);
+       spl_fstrans_unmark(cookie);
  }
  
  #else
  
+static void
+zpl_drop_inode(struct inode *ip)
+{
+       generic_delete_inode(ip);
+}
+
  static void
  zpl_clear_inode(struct inode *ip)
  {
+       fstrans_cookie_t cookie;
+
+       cookie = spl_fstrans_mark();
         zfs_inactive(ip);
+       spl_fstrans_unmark(cookie);
  }
  
  static void
@@ -117,26 +139,31 @@ zpl_inode_delete(struct inode *ip)
         truncate_setsize(ip, 0);
         clear_inode(ip);
  }
-
  #endif /* HAVE_EVICT_INODE */
  
  static void
  zpl_put_super(struct super_block *sb)
  {
+       fstrans_cookie_t cookie;
         int error;
  
+       cookie = spl_fstrans_mark();
         error = -zfs_umount(sb);
+       spl_fstrans_unmark(cookie);
         ASSERT3S(error, <=, 0);
  }
  
  static int
  zpl_sync_fs(struct super_block *sb, int wait)
  {
+       fstrans_cookie_t cookie;
         cred_t *cr = CRED();
         int error;
  
         crhold(cr);
+       cookie = spl_fstrans_mark();
         error = -zfs_sync(sb, wait, cr);
+       spl_fstrans_unmark(cookie);
         crfree(cr);
         ASSERT3S(error, <=, 0);
  
@@ -146,70 +173,271 @@ zpl_sync_fs(struct super_block *sb, int wait)
  static int
  zpl_statfs(struct dentry *dentry, struct kstatfs *statp)
  {
+       fstrans_cookie_t cookie;
         int error;
  
+       cookie = spl_fstrans_mark();
         error = -zfs_statvfs(dentry, statp);
+       spl_fstrans_unmark(cookie);
         ASSERT3S(error, <=, 0);
  
         return (error);
  }
  
+enum {
+       TOKEN_RO,
+       TOKEN_RW,
+       TOKEN_SETUID,
+       TOKEN_NOSETUID,
+       TOKEN_EXEC,
+       TOKEN_NOEXEC,
+       TOKEN_DEVICES,
+       TOKEN_NODEVICES,
+       TOKEN_DIRXATTR,
+       TOKEN_SAXATTR,
+       TOKEN_XATTR,
+       TOKEN_NOXATTR,
+       TOKEN_ATIME,
+       TOKEN_NOATIME,
+       TOKEN_RELATIME,
+       TOKEN_NORELATIME,
+       TOKEN_NBMAND,
+       TOKEN_NONBMAND,
+       TOKEN_MNTPOINT,
+       TOKEN_LAST,
+};
+
+static const match_table_t zpl_tokens = {
+       { TOKEN_RO,             MNTOPT_RO },
+       { TOKEN_RW,             MNTOPT_RW },
+       { TOKEN_SETUID,         MNTOPT_SETUID },
+       { TOKEN_NOSETUID,       MNTOPT_NOSETUID },
+       { TOKEN_EXEC,           MNTOPT_EXEC },
+       { TOKEN_NOEXEC,         MNTOPT_NOEXEC },
+       { TOKEN_DEVICES,        MNTOPT_DEVICES },
+       { TOKEN_NODEVICES,      MNTOPT_NODEVICES },
+       { TOKEN_DIRXATTR,       MNTOPT_DIRXATTR },
+       { TOKEN_SAXATTR,        MNTOPT_SAXATTR },
+       { TOKEN_XATTR,          MNTOPT_XATTR },
+       { TOKEN_NOXATTR,        MNTOPT_NOXATTR },
+       { TOKEN_ATIME,          MNTOPT_ATIME },
+       { TOKEN_NOATIME,        MNTOPT_NOATIME },
+       { TOKEN_RELATIME,       MNTOPT_RELATIME },
+       { TOKEN_NORELATIME,     MNTOPT_NORELATIME },
+       { TOKEN_NBMAND,         MNTOPT_NBMAND },
+       { TOKEN_NONBMAND,       MNTOPT_NONBMAND },
+       { TOKEN_MNTPOINT,       MNTOPT_MNTPOINT "=%s" },
+       { TOKEN_LAST,           NULL },
+};
+
+static int
+zpl_parse_option(char *option, int token, substring_t *args, zfs_mntopts_t *zmo)
+{
+       switch (token) {
+       case TOKEN_RO:
+               zmo->z_readonly = B_TRUE;
+               zmo->z_do_readonly = B_TRUE;
+               break;
+       case TOKEN_RW:
+               zmo->z_readonly = B_FALSE;
+               zmo->z_do_readonly = B_TRUE;
+               break;
+       case TOKEN_SETUID:
+               zmo->z_setuid = B_TRUE;
+               zmo->z_do_setuid = B_TRUE;
+               break;
+       case TOKEN_NOSETUID:
+               zmo->z_setuid = B_FALSE;
+               zmo->z_do_setuid = B_TRUE;
+               break;
+       case TOKEN_EXEC:
+               zmo->z_exec = B_TRUE;
+               zmo->z_do_exec = B_TRUE;
+               break;
+       case TOKEN_NOEXEC:
+               zmo->z_exec = B_FALSE;
+               zmo->z_do_exec = B_TRUE;
+               break;
+       case TOKEN_DEVICES:
+               zmo->z_devices = B_TRUE;
+               zmo->z_do_devices = B_TRUE;
+               break;
+       case TOKEN_NODEVICES:
+               zmo->z_devices = B_FALSE;
+               zmo->z_do_devices = B_TRUE;
+               break;
+       case TOKEN_DIRXATTR:
+               zmo->z_xattr = ZFS_XATTR_DIR;
+               zmo->z_do_xattr = B_TRUE;
+               break;
+       case TOKEN_SAXATTR:
+               zmo->z_xattr = ZFS_XATTR_SA;
+               zmo->z_do_xattr = B_TRUE;
+               break;
+       case TOKEN_XATTR:
+               zmo->z_xattr = ZFS_XATTR_DIR;
+               zmo->z_do_xattr = B_TRUE;
+               break;
+       case TOKEN_NOXATTR:
+               zmo->z_xattr = ZFS_XATTR_OFF;
+               zmo->z_do_xattr = B_TRUE;
+               break;
+       case TOKEN_ATIME:
+               zmo->z_atime = B_TRUE;
+               zmo->z_do_atime = B_TRUE;
+               break;
+       case TOKEN_NOATIME:
+               zmo->z_atime = B_FALSE;
+               zmo->z_do_atime = B_TRUE;
+               break;
+       case TOKEN_RELATIME:
+               zmo->z_relatime = B_TRUE;
+               zmo->z_do_relatime = B_TRUE;
+               break;
+       case TOKEN_NORELATIME:
+               zmo->z_relatime = B_FALSE;
+               zmo->z_do_relatime = B_TRUE;
+               break;
+       case TOKEN_NBMAND:
+               zmo->z_nbmand = B_TRUE;
+               zmo->z_do_nbmand = B_TRUE;
+               break;
+       case TOKEN_NONBMAND:
+               zmo->z_nbmand = B_FALSE;
+               zmo->z_do_nbmand = B_TRUE;
+               break;
+       case TOKEN_MNTPOINT:
+               zmo->z_mntpoint = match_strdup(&args[0]);
+               if (zmo->z_mntpoint == NULL)
+                       return (-ENOMEM);
+
+               break;
+       default:
+               break;
+       }
+
+       return (0);
+}
+
+/*
+ * Parse the comma separated mntopts string into zmo, returning 0 or a
+ * negative errno; on error zmo is not modified.  Set isremount when zmo
+ * is being recycled.  strsep() advances 't' so tmp_mntopts can be freed.
+ */
+static int
+zpl_parse_options(char *osname, char *mntopts, zfs_mntopts_t *zmo,
+    boolean_t isremount)
+{
+       zfs_mntopts_t *tmp_zmo;
+       int error;
+
+       tmp_zmo = zfs_mntopts_alloc();
+       tmp_zmo->z_osname = strdup(osname);
+
+       if (mntopts) {
+               substring_t args[MAX_OPT_ARGS];
+               char *tmp_mntopts, *p, *t;
+               int token;
+
+               t = tmp_mntopts = strdup(mntopts); /* t: strsep() cursor */
+
+               while ((p = strsep(&t, ",")) != NULL) {
+                       if (!*p)
+                               continue;
+
+                       args[0].to = args[0].from = NULL;
+                       token = match_token(p, zpl_tokens, args);
+                       error = zpl_parse_option(p, token, args, tmp_zmo);
+                       if (error) {
+                               zfs_mntopts_free(tmp_zmo);
+                               strfree(tmp_mntopts);
+                               return (error);
+                       }
+               }
+
+               strfree(tmp_mntopts);
+       }
+
+       if (isremount == B_TRUE) {
+               if (zmo->z_osname)
+                       strfree(zmo->z_osname);
+
+               if (zmo->z_mntpoint)
+                       strfree(zmo->z_mntpoint);
+       } else {
+               ASSERT3P(zmo->z_osname, ==, NULL);
+               ASSERT3P(zmo->z_mntpoint, ==, NULL);
+       }
+
+       memcpy(zmo, tmp_zmo, sizeof (zfs_mntopts_t));
+       kmem_free(tmp_zmo, sizeof (zfs_mntopts_t)); /* zmo owns the strings */
+
+       return (0);
+}
+
  static int
  zpl_remount_fs(struct super_block *sb, int *flags, char *data)
  {
+       zfs_sb_t *zsb = sb->s_fs_info;
+       fstrans_cookie_t cookie;
         int error;
-       error = -zfs_remount(sb, flags, data);
+
+       error = zpl_parse_options(zsb->z_mntopts->z_osname, data,
+           zsb->z_mntopts, B_TRUE);
+       if (error)
+               return (error);
+
+       cookie = spl_fstrans_mark();
+       error = -zfs_remount(sb, flags, zsb->z_mntopts);
+       spl_fstrans_unmark(cookie);
         ASSERT3S(error, <=, 0);
  
         return (error);
  }
  
-static void
-zpl_umount_begin(struct super_block *sb)
+static int
+__zpl_show_options(struct seq_file *seq, zfs_sb_t *zsb)
  {
-       zfs_sb_t *zsb = sb->s_fs_info;
-       int count;
-
-       /*
-        * Best effort to unmount snapshots in .zfs/snapshot/.  Normally this
-        * isn't required because snapshots have the MNT_SHRINKABLE flag set.
-        */
-       if (zsb->z_ctldir)
-               (void) zfsctl_unmount_snapshots(zsb, MNT_FORCE, &count);
+       seq_printf(seq, ",%s", zsb->z_flags & ZSB_XATTR ? "xattr" : "noxattr");
+
+#ifdef CONFIG_FS_POSIX_ACL
+       switch (zsb->z_acl_type) {
+       case ZFS_ACLTYPE_POSIXACL:
+               seq_puts(seq, ",posixacl");
+               break;
+       default:
+               seq_puts(seq, ",noacl");
+               break;
+       }
+#endif /* CONFIG_FS_POSIX_ACL */
+
+       return (0);
  }
  
-/*
- * The Linux VFS automatically handles the following flags:
- * MNT_NOSUID, MNT_NODEV, MNT_NOEXEC, MNT_NOATIME, MNT_READONLY
- */
  #ifdef HAVE_SHOW_OPTIONS_WITH_DENTRY
  static int
  zpl_show_options(struct seq_file *seq, struct dentry *root)
  {
-       zfs_sb_t *zsb = root->d_sb->s_fs_info;
-
-       seq_printf(seq, ",%s", zsb->z_flags & ZSB_XATTR ? "xattr" : "noxattr");
-
-       return (0);
+       return (__zpl_show_options(seq, root->d_sb->s_fs_info));
  }
  #else
  static int
  zpl_show_options(struct seq_file *seq, struct vfsmount *vfsp)
  {
-       zfs_sb_t *zsb = vfsp->mnt_sb->s_fs_info;
-
-       seq_printf(seq, ",%s", zsb->z_flags & ZSB_XATTR ? "xattr" : "noxattr");
-
-       return (0);
+       return (__zpl_show_options(seq, vfsp->mnt_sb->s_fs_info));
  }
  #endif /* HAVE_SHOW_OPTIONS_WITH_DENTRY */
  
  static int
  zpl_fill_super(struct super_block *sb, void *data, int silent)
  {
+       zfs_mntopts_t *zmo = (zfs_mntopts_t *)data;
+       fstrans_cookie_t cookie;
         int error;
  
-       error = -zfs_domount(sb, data, silent);
+       cookie = spl_fstrans_mark();
+       error = -zfs_domount(sb, zmo, silent);
+       spl_fstrans_unmark(cookie);
         ASSERT3S(error, <=, 0);
  
         return (error);
@@ -220,18 +448,32 @@ static struct dentry *
  zpl_mount(struct file_system_type *fs_type, int flags,
      const char *osname, void *data)
  {
-       zpl_mount_data_t zmd = { osname, data };
+       zfs_mntopts_t *zmo = zfs_mntopts_alloc();
+       int error;
+
+       error = zpl_parse_options((char *)osname, (char *)data, zmo, B_FALSE);
+       if (error) {
+               zfs_mntopts_free(zmo);
+               return (ERR_PTR(error));
+       }
  
-       return mount_nodev(fs_type, flags, &zmd, zpl_fill_super);
+       return (mount_nodev(fs_type, flags, zmo, zpl_fill_super));
  }
  #else
  static int
  zpl_get_sb(struct file_system_type *fs_type, int flags,
      const char *osname, void *data, struct vfsmount *mnt)
  {
-       zpl_mount_data_t zmd = { osname, data };
+       zfs_mntopts_t *zmo = zfs_mntopts_alloc();
+       int error;
+
+       error = zpl_parse_options((char *)osname, (char *)data, zmo, B_FALSE);
+       if (error) {
+               zfs_mntopts_free(zmo);
+               return (error);
+       }
  
-       return get_sb_nodev(fs_type, flags, &zmd, zpl_fill_super, mnt);
+       return (get_sb_nodev(fs_type, flags, zmo, zpl_fill_super, mnt));
  }
  #endif /* HAVE_MOUNT_NODEV */
  
@@ -246,83 +488,28 @@ zpl_kill_sb(struct super_block *sb)
  #endif /* HAVE_S_INSTANCES_LIST_HEAD */
  }
  
-#ifdef HAVE_SHRINK
-/*
- * Linux 3.1 - 3.x API
- *
- * The Linux 3.1 API introduced per-sb cache shrinkers to replace the
- * global ones.  This allows us a mechanism to cleanly target a specific
- * zfs file system when the dnode and inode caches grow too large.
- *
- * In addition, the 3.0 kernel added the iterate_supers_type() helper
- * function which is used to safely walk all of the zfs file systems.
- */
-static void
-zpl_prune_sb(struct super_block *sb, void *arg)
-{
-       int objects = 0;
-       int error;
-
-       error = -zfs_sb_prune(sb, *(unsigned long *)arg, &objects);
-       ASSERT3S(error, <=, 0);
-
-       return;
-}
-
-void
-zpl_prune_sbs(int64_t bytes_to_scan, void *private)
-{
-       unsigned long nr_to_scan = (bytes_to_scan / sizeof(znode_t));
-
-       iterate_supers_type(&zpl_fs_type, zpl_prune_sb, &nr_to_scan);
-       kmem_reap();
-}
-#else
-/*
- * Linux 2.6.x - 3.0 API
- *
- * These are best effort interfaces are provided by the SPL to induce
- * the Linux VM subsystem to reclaim a fraction of the both dnode and
- * inode caches.  Ideally, we want to just target the zfs file systems
- * however our only option is to reclaim from them all.
- */
  void
-zpl_prune_sbs(int64_t bytes_to_scan, void *private)
+zpl_prune_sb(int64_t nr_to_scan, void *arg)
  {
-       unsigned long nr_to_scan = (bytes_to_scan / sizeof(znode_t));
+       struct super_block *sb = (struct super_block *)arg;
+       int objects = 0;
  
-        shrink_dcache_memory(nr_to_scan, GFP_KERNEL);
-        shrink_icache_memory(nr_to_scan, GFP_KERNEL);
-        kmem_reap();
+       (void) -zfs_sb_prune(sb, nr_to_scan, &objects);
  }
-#endif /* HAVE_SHRINK */
  
  #ifdef HAVE_NR_CACHED_OBJECTS
  static int
  zpl_nr_cached_objects(struct super_block *sb)
  {
-       zfs_sb_t *zsb = sb->s_fs_info;
-       int nr;
-
-       mutex_enter(&zsb->z_znodes_lock);
-       nr = zsb->z_nr_znodes;
-       mutex_exit(&zsb->z_znodes_lock);
-
-       return (nr);
+       return (0);
  }
  #endif /* HAVE_NR_CACHED_OBJECTS */
  
  #ifdef HAVE_FREE_CACHED_OBJECTS
-/*
- * Attempt to evict some meta data from the cache.  The ARC operates in
- * terms of bytes while the Linux VFS uses objects.  Now because this is
- * just a best effort eviction and the exact values aren't critical so we
- * extrapolate from an object count to a byte size using the znode_t size.
- */
  static void
  zpl_free_cached_objects(struct super_block *sb, int nr_to_scan)
  {
-       arc_adjust_meta(nr_to_scan * sizeof(znode_t), B_FALSE);
+       /* noop */
  }
  #endif /* HAVE_FREE_CACHED_OBJECTS */
  
@@ -331,10 +518,10 @@ const struct super_operations zpl_super_operations = {
         .destroy_inode          = zpl_inode_destroy,
         .dirty_inode            = zpl_dirty_inode,
         .write_inode            = NULL,
-       .drop_inode             = NULL,
  #ifdef HAVE_EVICT_INODE
         .evict_inode            = zpl_evict_inode,
  #else
+       .drop_inode             = zpl_drop_inode,
         .clear_inode            = zpl_clear_inode,
         .delete_inode           = zpl_inode_delete,
  #endif /* HAVE_EVICT_INODE */
@@ -342,7 +529,6 @@ const struct super_operations zpl_super_operations = {
         .sync_fs                = zpl_sync_fs,
         .statfs                 = zpl_statfs,
         .remount_fs             = zpl_remount_fs,
-       .umount_begin           = zpl_umount_begin,
         .show_options           = zpl_show_options,
         .show_stats             = NULL,
  #ifdef HAVE_NR_CACHED_OBJECTS