]> git.proxmox.com Git - mirror_zfs.git/blobdiff - module/zfs/zfs_acl.c
Fix typo/etc in module/zfs/zfs_ctldir.c
[mirror_zfs.git] / module / zfs / zfs_acl.c
index 12ffe9f30a1413e27ec82d05de44eb2761f58fe7..b1af4da2f4a5f8e0fd8e816e94e376717eaf6f08 100644 (file)
  * CDDL HEADER END
  */
 /*
- * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
- * Use is subject to license terms.
+ * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
+ * Copyright (c) 2013 by Delphix. All rights reserved.
  */
 
+
 #include <sys/types.h>
 #include <sys/param.h>
 #include <sys/time.h>
-#include <sys/systm.h>
 #include <sys/sysmacros.h>
-#include <sys/resource.h>
 #include <sys/vfs.h>
 #include <sys/vnode.h>
 #include <sys/sid.h>
@@ -37,7 +36,6 @@
 #include <sys/kmem.h>
 #include <sys/cmn_err.h>
 #include <sys/errno.h>
-#include <sys/unistd.h>
 #include <sys/sdt.h>
 #include <sys/fs/zfs.h>
 #include <sys/mode.h>
@@ -50,8 +48,9 @@
 #include <sys/dmu.h>
 #include <sys/dnode.h>
 #include <sys/zap.h>
-#include "fs/fs_subr.h"
-#include <acl/acl_common.h>
+#include <sys/sa.h>
+#include <sys/trace_acl.h>
+#include <sys/zpl.h>
 
 #define        ALLOW   ACE_ACCESS_ALLOWED_ACE_TYPE
 #define        DENY    ACE_ACCESS_DENIED_ACE_TYPE
@@ -95,6 +94,8 @@
 
 #define        ALL_MODE_EXECS (S_IXUSR | S_IXGRP | S_IXOTH)
 
+#define        IDMAP_WK_CREATOR_OWNER_UID      2147483648U
+
 static uint16_t
 zfs_ace_v0_get_type(void *acep)
 {
@@ -171,18 +172,18 @@ zfs_ace_v0_data(void *acep, void **datap)
 }
 
 static acl_ops_t zfs_acl_v0_ops = {
-       zfs_ace_v0_get_mask,
-       zfs_ace_v0_set_mask,
-       zfs_ace_v0_get_flags,
-       zfs_ace_v0_set_flags,
-       zfs_ace_v0_get_type,
-       zfs_ace_v0_set_type,
-       zfs_ace_v0_get_who,
-       zfs_ace_v0_set_who,
-       zfs_ace_v0_size,
-       zfs_ace_v0_abstract_size,
-       zfs_ace_v0_mask_off,
-       zfs_ace_v0_data
+       .ace_mask_get = zfs_ace_v0_get_mask,
+       .ace_mask_set = zfs_ace_v0_set_mask,
+       .ace_flags_get = zfs_ace_v0_get_flags,
+       .ace_flags_set = zfs_ace_v0_set_flags,
+       .ace_type_get = zfs_ace_v0_get_type,
+       .ace_type_set = zfs_ace_v0_set_type,
+       .ace_who_get = zfs_ace_v0_get_who,
+       .ace_who_set = zfs_ace_v0_set_who,
+       .ace_size = zfs_ace_v0_size,
+       .ace_abstract_size = zfs_ace_v0_abstract_size,
+       .ace_mask_off = zfs_ace_v0_mask_off,
+       .ace_data = zfs_ace_v0_data
 };
 
 static uint16_t
@@ -307,20 +308,131 @@ zfs_ace_fuid_data(void *acep, void **datap)
 }
 
 static acl_ops_t zfs_acl_fuid_ops = {
-       zfs_ace_fuid_get_mask,
-       zfs_ace_fuid_set_mask,
-       zfs_ace_fuid_get_flags,
-       zfs_ace_fuid_set_flags,
-       zfs_ace_fuid_get_type,
-       zfs_ace_fuid_set_type,
-       zfs_ace_fuid_get_who,
-       zfs_ace_fuid_set_who,
-       zfs_ace_fuid_size,
-       zfs_ace_fuid_abstract_size,
-       zfs_ace_fuid_mask_off,
-       zfs_ace_fuid_data
+       .ace_mask_get = zfs_ace_fuid_get_mask,
+       .ace_mask_set = zfs_ace_fuid_set_mask,
+       .ace_flags_get = zfs_ace_fuid_get_flags,
+       .ace_flags_set = zfs_ace_fuid_set_flags,
+       .ace_type_get = zfs_ace_fuid_get_type,
+       .ace_type_set = zfs_ace_fuid_set_type,
+       .ace_who_get = zfs_ace_fuid_get_who,
+       .ace_who_set = zfs_ace_fuid_set_who,
+       .ace_size = zfs_ace_fuid_size,
+       .ace_abstract_size = zfs_ace_fuid_abstract_size,
+       .ace_mask_off = zfs_ace_fuid_mask_off,
+       .ace_data = zfs_ace_fuid_data
 };
 
+/*
+ * The following three functions are provided for compatibility with
+ * older ZPL version in order to determine if the file use to have
+ * an external ACL and what version of ACL previously existed on the
+ * file.  Would really be nice to not need this, sigh.
+ */
+uint64_t
+zfs_external_acl(znode_t *zp)
+{
+       zfs_acl_phys_t acl_phys;
+       int error;
+
+       if (zp->z_is_sa)
+               return (0);
+
+       /*
+        * Need to deal with a potential
+        * race where zfs_sa_upgrade could cause
+        * z_isa_sa to change.
+        *
+        * If the lookup fails then the state of z_is_sa should have
+        * changed.
+        */
+
+       if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_ZNODE_ACL(ZTOZSB(zp)),
+           &acl_phys, sizeof (acl_phys))) == 0)
+               return (acl_phys.z_acl_extern_obj);
+       else {
+               /*
+                * after upgrade the SA_ZPL_ZNODE_ACL should have been
+                * removed
+                */
+               VERIFY(zp->z_is_sa && error == ENOENT);
+               return (0);
+       }
+}
+
+/*
+ * Determine size of ACL in bytes
+ *
+ * This is more complicated than it should be since we have to deal
+ * with old external ACLs.
+ */
+static int
+zfs_acl_znode_info(znode_t *zp, int *aclsize, int *aclcount,
+    zfs_acl_phys_t *aclphys)
+{
+       zfsvfs_t *zfsvfs = ZTOZSB(zp);
+       uint64_t acl_count;
+       int size;
+       int error;
+
+       ASSERT(MUTEX_HELD(&zp->z_acl_lock));
+       if (zp->z_is_sa) {
+               if ((error = sa_size(zp->z_sa_hdl, SA_ZPL_DACL_ACES(zfsvfs),
+                   &size)) != 0)
+                       return (error);
+               *aclsize = size;
+               if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_DACL_COUNT(zfsvfs),
+                   &acl_count, sizeof (acl_count))) != 0)
+                       return (error);
+               *aclcount = acl_count;
+       } else {
+               if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_ZNODE_ACL(zfsvfs),
+                   aclphys, sizeof (*aclphys))) != 0)
+                       return (error);
+
+               if (aclphys->z_acl_version == ZFS_ACL_VERSION_INITIAL) {
+                       *aclsize = ZFS_ACL_SIZE(aclphys->z_acl_size);
+                       *aclcount = aclphys->z_acl_size;
+               } else {
+                       *aclsize = aclphys->z_acl_size;
+                       *aclcount = aclphys->z_acl_count;
+               }
+       }
+       return (0);
+}
+
+int
+zfs_znode_acl_version(znode_t *zp)
+{
+       zfs_acl_phys_t acl_phys;
+
+       if (zp->z_is_sa)
+               return (ZFS_ACL_VERSION_FUID);
+       else {
+               int error;
+
+               /*
+                * Need to deal with a potential
+                * race where zfs_sa_upgrade could cause
+                * z_isa_sa to change.
+                *
+                * If the lookup fails then the state of z_is_sa should have
+                * changed.
+                */
+               if ((error = sa_lookup(zp->z_sa_hdl,
+                   SA_ZPL_ZNODE_ACL(ZTOZSB(zp)),
+                   &acl_phys, sizeof (acl_phys))) == 0)
+                       return (acl_phys.z_acl_version);
+               else {
+                       /*
+                        * After upgrade SA_ZPL_ZNODE_ACL should have
+                        * been removed.
+                        */
+                       VERIFY(zp->z_is_sa && error == ENOENT);
+                       return (ZFS_ACL_VERSION_FUID);
+               }
+       }
+}
+
 static int
 zfs_acl_version(int version)
 {
@@ -333,10 +445,10 @@ zfs_acl_version(int version)
 static int
 zfs_acl_version_zp(znode_t *zp)
 {
-       return (zfs_acl_version(zp->z_zfsvfs->z_version));
+       return (zfs_acl_version(ZTOZSB(zp)->z_version));
 }
 
-static zfs_acl_t *
+zfs_acl_t *
 zfs_acl_alloc(int vers)
 {
        zfs_acl_t *aclp;
@@ -346,13 +458,13 @@ zfs_acl_alloc(int vers)
            offsetof(zfs_acl_node_t, z_next));
        aclp->z_version = vers;
        if (vers == ZFS_ACL_VERSION_FUID)
-               aclp->z_ops = zfs_acl_fuid_ops;
+               aclp->z_ops = &zfs_acl_fuid_ops;
        else
-               aclp->z_ops = zfs_acl_v0_ops;
+               aclp->z_ops = &zfs_acl_v0_ops;
        return (aclp);
 }
 
-static zfs_acl_node_t *
+zfs_acl_node_t *
 zfs_acl_node_alloc(size_t bytes)
 {
        zfs_acl_node_t *aclnode;
@@ -381,7 +493,7 @@ zfs_acl_release_nodes(zfs_acl_t *aclp)
 {
        zfs_acl_node_t *aclnode;
 
-       while (aclnode = list_head(&aclp->z_acl)) {
+       while ((aclnode = list_head(&aclp->z_acl))) {
                list_remove(&aclp->z_acl, aclnode);
                zfs_acl_node_free(aclnode);
        }
@@ -420,7 +532,7 @@ zfs_acl_valid_ace_type(uint_t type, uint_t flags)
 }
 
 static boolean_t
-zfs_ace_valid(vtype_t obj_type, zfs_acl_t *aclp, uint16_t type, uint16_t iflags)
+zfs_ace_valid(umode_t obj_mode, zfs_acl_t *aclp, uint16_t type, uint16_t iflags)
 {
        /*
         * first check type of entry
@@ -443,7 +555,7 @@ zfs_ace_valid(vtype_t obj_type, zfs_acl_t *aclp, uint16_t type, uint16_t iflags)
         * next check inheritance level flags
         */
 
-       if (obj_type == VDIR &&
+       if (S_ISDIR(obj_mode) &&
            (iflags & (ACE_FILE_INHERIT_ACE|ACE_DIRECTORY_INHERIT_ACE)))
                aclp->z_hints |= ZFS_INHERIT_ACE;
 
@@ -463,6 +575,8 @@ zfs_acl_next_ace(zfs_acl_t *aclp, void *start, uint64_t *who,
 {
        zfs_acl_node_t *aclnode;
 
+       ASSERT(aclp);
+
        if (start == NULL) {
                aclnode = list_head(&aclp->z_acl);
                if (aclnode == NULL)
@@ -496,19 +610,20 @@ zfs_acl_next_ace(zfs_acl_t *aclp, void *start, uint64_t *who,
                /*
                 * Make sure we don't overstep our bounds
                 */
-               ace_size = aclp->z_ops.ace_size(acep);
+               ace_size = aclp->z_ops->ace_size(acep);
 
                if (((caddr_t)acep + ace_size) >
                    ((caddr_t)aclnode->z_acldata + aclnode->z_size)) {
                        return (NULL);
                }
 
-               *iflags = aclp->z_ops.ace_flags_get(acep);
-               *type = aclp->z_ops.ace_type_get(acep);
-               *access_mask = aclp->z_ops.ace_mask_get(acep);
-               *who = aclp->z_ops.ace_who_get(acep);
+               *iflags = aclp->z_ops->ace_flags_get(acep);
+               *type = aclp->z_ops->ace_type_get(acep);
+               *access_mask = aclp->z_ops->ace_mask_get(acep);
+               *who = aclp->z_ops->ace_who_get(acep);
                aclp->z_next_ace = (caddr_t)aclp->z_next_ace + ace_size;
                aclnode->z_ace_idx++;
+
                return ((void *)acep);
        }
        return (NULL);
@@ -528,21 +643,14 @@ zfs_ace_walk(void *datap, uint64_t cookie, int aclcnt,
        return ((uint64_t)(uintptr_t)acep);
 }
 
-static zfs_acl_node_t *
-zfs_acl_curr_node(zfs_acl_t *aclp)
-{
-       ASSERT(aclp->z_curr_node);
-       return (aclp->z_curr_node);
-}
-
 /*
  * Copy ACE to internal ZFS format.
  * While processing the ACL each ACE will be validated for correctness.
  * ACE FUIDs will be created later.
  */
 int
-zfs_copy_ace_2_fuid(zfsvfs_t *zfsvfs, vtype_t obj_type, zfs_acl_t *aclp,
-    void *datap, zfs_ace_t *z_acl, int aclcnt, size_t *size,
+zfs_copy_ace_2_fuid(zfsvfs_t *zfsvfs, umode_t obj_mode, zfs_acl_t *aclp,
+    void *datap, zfs_ace_t *z_acl, uint64_t aclcnt, size_t *size,
     zfs_fuid_info_t **fuidp, cred_t *cr)
 {
        int i;
@@ -567,9 +675,9 @@ zfs_copy_ace_2_fuid(zfsvfs_t *zfsvfs, vtype_t obj_type, zfs_acl_t *aclp,
                /*
                 * Make sure ACE is valid
                 */
-               if (zfs_ace_valid(obj_type, aclp, aceptr->z_hdr.z_type,
+               if (zfs_ace_valid(obj_mode, aclp, aceptr->z_hdr.z_type,
                    aceptr->z_hdr.z_flags) != B_TRUE)
-                       return (EINVAL);
+                       return (SET_ERROR(EINVAL));
 
                switch (acep->a_type) {
                case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE:
@@ -591,7 +699,7 @@ zfs_copy_ace_2_fuid(zfsvfs_t *zfsvfs, vtype_t obj_type, zfs_acl_t *aclp,
                }
 
                aceptr = (zfs_ace_t *)((caddr_t)aceptr +
-                   aclp->z_ops.ace_size(aceptr));
+                   aclp->z_ops->ace_size(aceptr));
        }
 
        *size = (caddr_t)aceptr - (caddr_t)z_acl;
@@ -616,8 +724,8 @@ zfs_copy_fuid_2_ace(zfsvfs_t *zfsvfs, zfs_acl_t *aclp, cred_t *cr,
        size_t ace_size;
        uint16_t entry_type;
 
-       while (zacep = zfs_acl_next_ace(aclp, zacep,
-           &who, &access_mask, &iflags, &type)) {
+       while ((zacep = zfs_acl_next_ace(aclp, zacep,
+           &who, &access_mask, &iflags, &type))) {
 
                switch (type) {
                case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE:
@@ -660,7 +768,7 @@ zfs_copy_fuid_2_ace(zfsvfs_t *zfsvfs, zfs_acl_t *aclp, cred_t *cr,
 }
 
 static int
-zfs_copy_ace_2_oldace(vtype_t obj_type, zfs_acl_t *aclp, ace_t *acep,
+zfs_copy_ace_2_oldace(umode_t obj_mode, zfs_acl_t *aclp, ace_t *acep,
     zfs_oldace_t *z_acl, int aclcnt, size_t *size)
 {
        int i;
@@ -674,9 +782,9 @@ zfs_copy_ace_2_oldace(vtype_t obj_type, zfs_acl_t *aclp, ace_t *acep,
                /*
                 * Make sure ACE is valid
                 */
-               if (zfs_ace_valid(obj_type, aclp, aceptr->z_type,
+               if (zfs_ace_valid(obj_mode, aclp, aceptr->z_type,
                    aceptr->z_flags) != B_TRUE)
-                       return (EINVAL);
+                       return (SET_ERROR(EINVAL));
        }
        *size = (caddr_t)aceptr - (caddr_t)z_acl;
        return (0);
@@ -707,8 +815,8 @@ zfs_acl_xform(znode_t *zp, zfs_acl_t *aclp, cred_t *cr)
        oldaclp = kmem_alloc(sizeof (zfs_oldace_t) * aclp->z_acl_count,
            KM_SLEEP);
        i = 0;
-       while (cookie = zfs_acl_next_ace(aclp, cookie, &who,
-           &access_mask, &iflags, &type)) {
+       while ((cookie = zfs_acl_next_ace(aclp, cookie, &who,
+           &access_mask, &iflags, &type))) {
                oldaclp[i].z_flags = iflags;
                oldaclp[i].z_type = type;
                oldaclp[i].z_fuid = who;
@@ -717,9 +825,9 @@ zfs_acl_xform(znode_t *zp, zfs_acl_t *aclp, cred_t *cr)
 
        newaclnode = zfs_acl_node_alloc(aclp->z_acl_count *
            sizeof (zfs_object_ace_t));
-       aclp->z_ops = zfs_acl_fuid_ops;
-       VERIFY(zfs_copy_ace_2_fuid(zp->z_zfsvfs, ZTOV(zp)->v_type, aclp,
-           oldaclp, newaclnode->z_acldata, aclp->z_acl_count,
+       aclp->z_ops = &zfs_acl_fuid_ops;
+       VERIFY(zfs_copy_ace_2_fuid(ZTOZSB(zp), ZTOI(zp)->i_mode,
+           aclp, oldaclp, newaclnode->z_acldata, aclp->z_acl_count,
            &newaclnode->z_size, NULL, cr) == 0);
        newaclnode->z_ace_count = aclp->z_acl_count;
        aclp->z_version = ZFS_ACL_VERSION;
@@ -761,20 +869,21 @@ zfs_set_ace(zfs_acl_t *aclp, void *acep, uint32_t access_mask,
 {
        uint16_t type = entry_type & ACE_TYPE_FLAGS;
 
-       aclp->z_ops.ace_mask_set(acep, access_mask);
-       aclp->z_ops.ace_type_set(acep, access_type);
-       aclp->z_ops.ace_flags_set(acep, entry_type);
+       aclp->z_ops->ace_mask_set(acep, access_mask);
+       aclp->z_ops->ace_type_set(acep, access_type);
+       aclp->z_ops->ace_flags_set(acep, entry_type);
        if ((type != ACE_OWNER && type != OWNING_GROUP &&
            type != ACE_EVERYONE))
-               aclp->z_ops.ace_who_set(acep, fuid);
+               aclp->z_ops->ace_who_set(acep, fuid);
 }
 
 /*
  * Determine mode of file based on ACL.
  * Also, create FUIDs for any User/Group ACEs
  */
-static uint64_t
-zfs_mode_compute(znode_t *zp, zfs_acl_t *aclp)
+uint64_t
+zfs_mode_compute(uint64_t fmode, zfs_acl_t *aclp,
+    uint64_t *pflags, uint64_t fuid, uint64_t fgid)
 {
        int             entry_type;
        mode_t          mode;
@@ -785,10 +894,10 @@ zfs_mode_compute(znode_t *zp, zfs_acl_t *aclp)
        uint32_t        access_mask;
        boolean_t       an_exec_denied = B_FALSE;
 
-       mode = (zp->z_phys->zp_mode & (S_IFMT | S_ISUID | S_ISGID | S_ISVTX));
+       mode = (fmode & (S_IFMT | S_ISUID | S_ISGID | S_ISVTX));
 
-       while (acep = zfs_acl_next_ace(aclp, acep, &who,
-           &access_mask, &iflags, &type)) {
+       while ((acep = zfs_acl_next_ace(aclp, acep, &who,
+           &access_mask, &iflags, &type))) {
 
                if (!zfs_acl_valid_ace_type(type, iflags))
                        continue;
@@ -803,7 +912,8 @@ zfs_mode_compute(znode_t *zp, zfs_acl_t *aclp)
                    entry_type == OWNING_GROUP))
                        continue;
 
-               if (entry_type == ACE_OWNER) {
+               if (entry_type == ACE_OWNER || (entry_type == 0 &&
+                   who == fuid)) {
                        if ((access_mask & ACE_READ_DATA) &&
                            (!(seen & S_IRUSR))) {
                                seen |= S_IRUSR;
@@ -825,7 +935,8 @@ zfs_mode_compute(znode_t *zp, zfs_acl_t *aclp)
                                        mode |= S_IXUSR;
                                }
                        }
-               } else if (entry_type == OWNING_GROUP) {
+               } else if (entry_type == OWNING_GROUP ||
+                   (entry_type == ACE_IDENTIFIER_GROUP && who == fgid)) {
                        if ((access_mask & ACE_READ_DATA) &&
                            (!(seen & S_IRGRP))) {
                                seen |= S_IRGRP;
@@ -930,61 +1041,29 @@ zfs_mode_compute(znode_t *zp, zfs_acl_t *aclp)
                an_exec_denied = B_TRUE;
 
        if (an_exec_denied)
-               zp->z_phys->zp_flags &= ~ZFS_NO_EXECS_DENIED;
+               *pflags &= ~ZFS_NO_EXECS_DENIED;
        else
-               zp->z_phys->zp_flags |= ZFS_NO_EXECS_DENIED;
+               *pflags |= ZFS_NO_EXECS_DENIED;
 
        return (mode);
 }
 
-static zfs_acl_t *
-zfs_acl_node_read_internal(znode_t *zp, boolean_t will_modify)
-{
-       zfs_acl_t       *aclp;
-       zfs_acl_node_t  *aclnode;
-
-       aclp = zfs_acl_alloc(zp->z_phys->zp_acl.z_acl_version);
-
-       /*
-        * Version 0 to 1 znode_acl_phys has the size/count fields swapped.
-        * Version 0 didn't have a size field, only a count.
-        */
-       if (zp->z_phys->zp_acl.z_acl_version == ZFS_ACL_VERSION_INITIAL) {
-               aclp->z_acl_count = zp->z_phys->zp_acl.z_acl_size;
-               aclp->z_acl_bytes = ZFS_ACL_SIZE(aclp->z_acl_count);
-       } else {
-               aclp->z_acl_count = zp->z_phys->zp_acl.z_acl_count;
-               aclp->z_acl_bytes = zp->z_phys->zp_acl.z_acl_size;
-       }
-
-       aclnode = zfs_acl_node_alloc(will_modify ? aclp->z_acl_bytes : 0);
-       aclnode->z_ace_count = aclp->z_acl_count;
-       if (will_modify) {
-               bcopy(zp->z_phys->zp_acl.z_ace_data, aclnode->z_acldata,
-                   aclp->z_acl_bytes);
-       } else {
-               aclnode->z_size = aclp->z_acl_bytes;
-               aclnode->z_acldata = &zp->z_phys->zp_acl.z_ace_data[0];
-       }
-
-       list_insert_head(&aclp->z_acl, aclnode);
-
-       return (aclp);
-}
-
 /*
  * Read an external acl object.  If the intent is to modify, always
  * create a new acl and leave any cached acl in place.
  */
-static int
-zfs_acl_node_read(znode_t *zp, zfs_acl_t **aclpp, boolean_t will_modify)
+int
+zfs_acl_node_read(struct znode *zp, boolean_t have_lock, zfs_acl_t **aclpp,
+    boolean_t will_modify)
 {
-       uint64_t extacl = zp->z_phys->zp_acl.z_acl_extern_obj;
        zfs_acl_t       *aclp;
-       size_t          aclsize;
-       size_t          acl_count;
+       int             aclsize = 0;
+       int             acl_count = 0;
        zfs_acl_node_t  *aclnode;
-       int error;
+       zfs_acl_phys_t  znode_acl;
+       int             version;
+       int             error;
+       boolean_t       drop_lock = B_FALSE;
 
        ASSERT(MUTEX_HELD(&zp->z_acl_lock));
 
@@ -993,45 +1072,234 @@ zfs_acl_node_read(znode_t *zp, zfs_acl_t **aclpp, boolean_t will_modify)
                return (0);
        }
 
-       if (zp->z_phys->zp_acl.z_acl_extern_obj == 0) {
-               *aclpp = zfs_acl_node_read_internal(zp, will_modify);
-               if (!will_modify)
-                       zp->z_acl_cached = *aclpp;
-               return (0);
+       /*
+        * close race where znode could be upgrade while trying to
+        * read the znode attributes.
+        *
+        * But this could only happen if the file isn't already an SA
+        * znode
+        */
+       if (!zp->z_is_sa && !have_lock) {
+               mutex_enter(&zp->z_lock);
+               drop_lock = B_TRUE;
        }
+       version = zfs_znode_acl_version(zp);
 
-       aclp = zfs_acl_alloc(zp->z_phys->zp_acl.z_acl_version);
-       if (zp->z_phys->zp_acl.z_acl_version == ZFS_ACL_VERSION_INITIAL) {
-               zfs_acl_phys_v0_t *zacl0 =
-                   (zfs_acl_phys_v0_t *)&zp->z_phys->zp_acl;
-
-               aclsize = ZFS_ACL_SIZE(zacl0->z_acl_count);
-               acl_count = zacl0->z_acl_count;
-       } else {
-               aclsize = zp->z_phys->zp_acl.z_acl_size;
-               acl_count = zp->z_phys->zp_acl.z_acl_count;
-               if (aclsize == 0)
-                       aclsize = acl_count * sizeof (zfs_ace_t);
+       if ((error = zfs_acl_znode_info(zp, &aclsize,
+           &acl_count, &znode_acl)) != 0) {
+               goto done;
        }
-       aclnode = zfs_acl_node_alloc(aclsize);
-       list_insert_head(&aclp->z_acl, aclnode);
-       error = dmu_read(zp->z_zfsvfs->z_os, extacl, 0,
-           aclsize, aclnode->z_acldata, DMU_READ_PREFETCH);
-       aclnode->z_ace_count = acl_count;
+
+       aclp = zfs_acl_alloc(version);
+
        aclp->z_acl_count = acl_count;
        aclp->z_acl_bytes = aclsize;
 
+       aclnode = zfs_acl_node_alloc(aclsize);
+       aclnode->z_ace_count = aclp->z_acl_count;
+       aclnode->z_size = aclsize;
+
+       if (!zp->z_is_sa) {
+               if (znode_acl.z_acl_extern_obj) {
+                       error = dmu_read(ZTOZSB(zp)->z_os,
+                           znode_acl.z_acl_extern_obj, 0, aclnode->z_size,
+                           aclnode->z_acldata, DMU_READ_PREFETCH);
+               } else {
+                       bcopy(znode_acl.z_ace_data, aclnode->z_acldata,
+                           aclnode->z_size);
+               }
+       } else {
+               error = sa_lookup(zp->z_sa_hdl, SA_ZPL_DACL_ACES(ZTOZSB(zp)),
+                   aclnode->z_acldata, aclnode->z_size);
+       }
+
        if (error != 0) {
                zfs_acl_free(aclp);
+               zfs_acl_node_free(aclnode);
                /* convert checksum errors into IO errors */
                if (error == ECKSUM)
-                       error = EIO;
-               return (error);
+                       error = SET_ERROR(EIO);
+               goto done;
        }
 
+       list_insert_head(&aclp->z_acl, aclnode);
+
        *aclpp = aclp;
        if (!will_modify)
                zp->z_acl_cached = aclp;
+done:
+       if (drop_lock)
+               mutex_exit(&zp->z_lock);
+       return (error);
+}
+
+/*ARGSUSED*/
+void
+zfs_acl_data_locator(void **dataptr, uint32_t *length, uint32_t buflen,
+    boolean_t start, void *userdata)
+{
+       zfs_acl_locator_cb_t *cb = (zfs_acl_locator_cb_t *)userdata;
+
+       if (start) {
+               cb->cb_acl_node = list_head(&cb->cb_aclp->z_acl);
+       } else {
+               cb->cb_acl_node = list_next(&cb->cb_aclp->z_acl,
+                   cb->cb_acl_node);
+       }
+       *dataptr = cb->cb_acl_node->z_acldata;
+       *length = cb->cb_acl_node->z_size;
+}
+
+int
+zfs_acl_chown_setattr(znode_t *zp)
+{
+       int error;
+       zfs_acl_t *aclp;
+
+       if (ZTOZSB(zp)->z_acl_type == ZFS_ACLTYPE_POSIXACL)
+               return (0);
+
+       ASSERT(MUTEX_HELD(&zp->z_lock));
+       ASSERT(MUTEX_HELD(&zp->z_acl_lock));
+
+       error = zfs_acl_node_read(zp, B_TRUE, &aclp, B_FALSE);
+       if (error == 0 && aclp->z_acl_count > 0)
+               zp->z_mode = ZTOI(zp)->i_mode =
+                   zfs_mode_compute(zp->z_mode, aclp,
+                   &zp->z_pflags, KUID_TO_SUID(ZTOI(zp)->i_uid),
+                   KGID_TO_SGID(ZTOI(zp)->i_gid));
+
+       /*
+        * Some ZFS implementations (ZEVO) create neither a ZNODE_ACL
+        * nor a DACL_ACES SA in which case ENOENT is returned from
+        * zfs_acl_node_read() when the SA can't be located.
+        * Allow chown/chgrp to succeed in these cases rather than
+        * returning an error that makes no sense in the context of
+        * the caller.
+        */
+       if (error == ENOENT)
+               return (0);
+
+       return (error);
+}
+
+static void
+acl_trivial_access_masks(mode_t mode, uint32_t *allow0, uint32_t *deny1,
+    uint32_t *deny2, uint32_t *owner, uint32_t *group, uint32_t *everyone)
+{
+       *deny1 = *deny2 = *allow0 = *group = 0;
+
+       if (!(mode & S_IRUSR) && (mode & (S_IRGRP|S_IROTH)))
+               *deny1 |= ACE_READ_DATA;
+       if (!(mode & S_IWUSR) && (mode & (S_IWGRP|S_IWOTH)))
+               *deny1 |= ACE_WRITE_DATA;
+       if (!(mode & S_IXUSR) && (mode & (S_IXGRP|S_IXOTH)))
+               *deny1 |= ACE_EXECUTE;
+
+       if (!(mode & S_IRGRP) && (mode & S_IROTH))
+               *deny2 = ACE_READ_DATA;
+       if (!(mode & S_IWGRP) && (mode & S_IWOTH))
+               *deny2 |= ACE_WRITE_DATA;
+       if (!(mode & S_IXGRP) && (mode & S_IXOTH))
+               *deny2 |= ACE_EXECUTE;
+
+       if ((mode & S_IRUSR) && (!(mode & S_IRGRP) && (mode & S_IROTH)))
+               *allow0 |= ACE_READ_DATA;
+       if ((mode & S_IWUSR) && (!(mode & S_IWGRP) && (mode & S_IWOTH)))
+               *allow0 |= ACE_WRITE_DATA;
+       if ((mode & S_IXUSR) && (!(mode & S_IXGRP) && (mode & S_IXOTH)))
+               *allow0 |= ACE_EXECUTE;
+
+       *owner = ACE_WRITE_ATTRIBUTES|ACE_WRITE_OWNER|ACE_WRITE_ACL|
+           ACE_WRITE_NAMED_ATTRS|ACE_READ_ACL|ACE_READ_ATTRIBUTES|
+           ACE_READ_NAMED_ATTRS|ACE_SYNCHRONIZE;
+       if (mode & S_IRUSR)
+               *owner |= ACE_READ_DATA;
+       if (mode & S_IWUSR)
+               *owner |= ACE_WRITE_DATA|ACE_APPEND_DATA;
+       if (mode & S_IXUSR)
+               *owner |= ACE_EXECUTE;
+
+       *group = ACE_READ_ACL|ACE_READ_ATTRIBUTES| ACE_READ_NAMED_ATTRS|
+           ACE_SYNCHRONIZE;
+       if (mode & S_IRGRP)
+               *group |= ACE_READ_DATA;
+       if (mode & S_IWGRP)
+               *group |= ACE_WRITE_DATA|ACE_APPEND_DATA;
+       if (mode & S_IXGRP)
+               *group |= ACE_EXECUTE;
+
+       *everyone = ACE_READ_ACL|ACE_READ_ATTRIBUTES| ACE_READ_NAMED_ATTRS|
+           ACE_SYNCHRONIZE;
+       if (mode & S_IROTH)
+               *everyone |= ACE_READ_DATA;
+       if (mode & S_IWOTH)
+               *everyone |= ACE_WRITE_DATA|ACE_APPEND_DATA;
+       if (mode & S_IXOTH)
+               *everyone |= ACE_EXECUTE;
+}
+
+/*
+ * ace_trivial:
+ * determine whether an ace_t acl is trivial
+ *
+ * Trivialness implies that the acl is composed of only
+ * owner, group, everyone entries.  ACL can't
+ * have read_acl denied, and write_owner/write_acl/write_attributes
+ * can only be owner@ entry.
+ */
+static int
+ace_trivial_common(void *acep, int aclcnt,
+    uint64_t (*walk)(void *, uint64_t, int aclcnt,
+    uint16_t *, uint16_t *, uint32_t *))
+{
+       uint16_t flags;
+       uint32_t mask;
+       uint16_t type;
+       uint64_t cookie = 0;
+
+       while ((cookie = walk(acep, cookie, aclcnt, &flags, &type, &mask))) {
+               switch (flags & ACE_TYPE_FLAGS) {
+               case ACE_OWNER:
+               case ACE_GROUP|ACE_IDENTIFIER_GROUP:
+               case ACE_EVERYONE:
+                       break;
+               default:
+                       return (1);
+               }
+
+               if (flags & (ACE_FILE_INHERIT_ACE|
+                   ACE_DIRECTORY_INHERIT_ACE|ACE_NO_PROPAGATE_INHERIT_ACE|
+                   ACE_INHERIT_ONLY_ACE))
+                       return (1);
+
+               /*
+                * Special check for some special bits
+                *
+                * Don't allow anybody to deny reading basic
+                * attributes or a files ACL.
+                */
+               if ((mask & (ACE_READ_ACL|ACE_READ_ATTRIBUTES)) &&
+                   (type == ACE_ACCESS_DENIED_ACE_TYPE))
+                       return (1);
+
+               /*
+                * Delete permissions are never set by default
+                */
+               if (mask & (ACE_DELETE|ACE_DELETE_CHILD))
+                       return (1);
+               /*
+                * only allow owner@ to have
+                * write_acl/write_owner/write_attributes/write_xattr/
+                */
+               if (type == ACE_ACCESS_ALLOWED_ACE_TYPE &&
+                   (!(flags & ACE_OWNER) && (mask &
+                   (ACE_WRITE_OWNER|ACE_WRITE_ACL| ACE_WRITE_ATTRIBUTES|
+                   ACE_WRITE_NAMED_ATTRS))))
+                       return (1);
+
+       }
+
        return (0);
 }
 
@@ -1045,28 +1313,36 @@ zfs_acl_node_read(znode_t *zp, zfs_acl_t **aclpp, boolean_t will_modify)
 int
 zfs_aclset_common(znode_t *zp, zfs_acl_t *aclp, cred_t *cr, dmu_tx_t *tx)
 {
-       int             error;
-       znode_phys_t    *zphys = zp->z_phys;
-       zfs_acl_phys_t  *zacl = &zphys->zp_acl;
-       zfsvfs_t        *zfsvfs = zp->z_zfsvfs;
-       uint64_t        aoid = zphys->zp_acl.z_acl_extern_obj;
-       uint64_t        off = 0;
-       dmu_object_type_t otype;
-       zfs_acl_node_t  *aclnode;
-
-       dmu_buf_will_dirty(zp->z_dbuf, tx);
+       int                     error;
+       zfsvfs_t                *zfsvfs = ZTOZSB(zp);
+       dmu_object_type_t       otype;
+       zfs_acl_locator_cb_t    locate = { 0 };
+       uint64_t                mode;
+       sa_bulk_attr_t          bulk[5];
+       uint64_t                ctime[2];
+       int                     count = 0;
+       zfs_acl_phys_t          acl_phys;
+
+       mode = zp->z_mode;
+
+       mode = zfs_mode_compute(mode, aclp, &zp->z_pflags,
+           KUID_TO_SUID(ZTOI(zp)->i_uid), KGID_TO_SGID(ZTOI(zp)->i_gid));
+
+       zp->z_mode = ZTOI(zp)->i_mode = mode;
+       SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_MODE(zfsvfs), NULL,
+           &mode, sizeof (mode));
+       SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_FLAGS(zfsvfs), NULL,
+           &zp->z_pflags, sizeof (zp->z_pflags));
+       SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_CTIME(zfsvfs), NULL,
+           &ctime, sizeof (ctime));
 
        if (zp->z_acl_cached) {
                zfs_acl_free(zp->z_acl_cached);
                zp->z_acl_cached = NULL;
        }
 
-       zphys->zp_mode = zfs_mode_compute(zp, aclp);
-
        /*
-        * Decide which object type to use.  If we are forced to
-        * use old ACL format then transform ACL into zfs_oldace_t
-        * layout.
+        * Upgrade needed?
         */
        if (!zfsvfs->z_use_fuids) {
                otype = DMU_OT_OLDACL;
@@ -1078,461 +1354,173 @@ zfs_aclset_common(znode_t *zp, zfs_acl_t *aclp, cred_t *cr, dmu_tx_t *tx)
                otype = DMU_OT_ACL;
        }
 
-       if (aclp->z_acl_bytes > ZFS_ACE_SPACE) {
-               /*
-                * If ACL was previously external and we are now
-                * converting to new ACL format then release old
-                * ACL object and create a new one.
-                */
-               if (aoid && aclp->z_version != zacl->z_acl_version) {
-                       error = dmu_object_free(zfsvfs->z_os,
-                           zp->z_phys->zp_acl.z_acl_extern_obj, tx);
-                       if (error)
-                               return (error);
-                       aoid = 0;
-               }
-               if (aoid == 0) {
-                       aoid = dmu_object_alloc(zfsvfs->z_os,
-                           otype, aclp->z_acl_bytes,
-                           otype == DMU_OT_ACL ? DMU_OT_SYSACL : DMU_OT_NONE,
-                           otype == DMU_OT_ACL ? DN_MAX_BONUSLEN : 0, tx);
-               } else {
-                       (void) dmu_object_set_blocksize(zfsvfs->z_os, aoid,
-                           aclp->z_acl_bytes, 0, tx);
-               }
-               zphys->zp_acl.z_acl_extern_obj = aoid;
-               for (aclnode = list_head(&aclp->z_acl); aclnode;
-                   aclnode = list_next(&aclp->z_acl, aclnode)) {
-                       if (aclnode->z_ace_count == 0)
-                               continue;
-                       dmu_write(zfsvfs->z_os, aoid, off,
-                           aclnode->z_size, aclnode->z_acldata, tx);
-                       off += aclnode->z_size;
-               }
-       } else {
-               void *start = zacl->z_ace_data;
-               /*
-                * Migrating back embedded?
-                */
-               if (zphys->zp_acl.z_acl_extern_obj) {
-                       error = dmu_object_free(zfsvfs->z_os,
-                           zp->z_phys->zp_acl.z_acl_extern_obj, tx);
-                       if (error)
-                               return (error);
-                       zphys->zp_acl.z_acl_extern_obj = 0;
-               }
-
-               for (aclnode = list_head(&aclp->z_acl); aclnode;
-                   aclnode = list_next(&aclp->z_acl, aclnode)) {
-                       if (aclnode->z_ace_count == 0)
-                               continue;
-                       bcopy(aclnode->z_acldata, start, aclnode->z_size);
-                       start = (caddr_t)start + aclnode->z_size;
-               }
-       }
-
-       /*
-        * If Old version then swap count/bytes to match old
-        * layout of znode_acl_phys_t.
-        */
-       if (aclp->z_version == ZFS_ACL_VERSION_INITIAL) {
-               zphys->zp_acl.z_acl_size = aclp->z_acl_count;
-               zphys->zp_acl.z_acl_count = aclp->z_acl_bytes;
-       } else {
-               zphys->zp_acl.z_acl_size = aclp->z_acl_bytes;
-               zphys->zp_acl.z_acl_count = aclp->z_acl_count;
-       }
-
-       zphys->zp_acl.z_acl_version = aclp->z_version;
-
        /*
-        * Replace ACL wide bits, but first clear them.
+        * Arrgh, we have to handle old on disk format
+        * as well as newer (preferred) SA format.
         */
-       zp->z_phys->zp_flags &= ~ZFS_ACL_WIDE_FLAGS;
-
-       zp->z_phys->zp_flags |= aclp->z_hints;
-
-       if (ace_trivial_common(aclp, 0, zfs_ace_walk) == 0)
-               zp->z_phys->zp_flags |= ZFS_ACL_TRIVIAL;
 
-       return (0);
-}
+       if (zp->z_is_sa) { /* the easy case, just update the ACL attribute */
+               locate.cb_aclp = aclp;
+               SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_DACL_ACES(zfsvfs),
+                   zfs_acl_data_locator, &locate, aclp->z_acl_bytes);
+               SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_DACL_COUNT(zfsvfs),
+                   NULL, &aclp->z_acl_count, sizeof (uint64_t));
+       } else { /* Painful legacy way */
+               zfs_acl_node_t *aclnode;
+               uint64_t off = 0;
+               uint64_t aoid;
+
+               if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_ZNODE_ACL(zfsvfs),
+                   &acl_phys, sizeof (acl_phys))) != 0)
+                       return (error);
 
-/*
- * Update access mask for prepended ACE
- *
- * This applies the "groupmask" value for aclmode property.
- */
-static void
-zfs_acl_prepend_fixup(zfs_acl_t *aclp, void  *acep, void  *origacep,
-    mode_t mode, uint64_t owner)
-{
-       int     rmask, wmask, xmask;
-       int     user_ace;
-       uint16_t aceflags;
-       uint32_t origmask, acepmask;
-       uint64_t fuid;
-
-       aceflags = aclp->z_ops.ace_flags_get(acep);
-       fuid = aclp->z_ops.ace_who_get(acep);
-       origmask = aclp->z_ops.ace_mask_get(origacep);
-       acepmask = aclp->z_ops.ace_mask_get(acep);
-
-       user_ace = (!(aceflags &
-           (ACE_OWNER|ACE_GROUP|ACE_IDENTIFIER_GROUP)));
-
-       if (user_ace && (fuid == owner)) {
-               rmask = S_IRUSR;
-               wmask = S_IWUSR;
-               xmask = S_IXUSR;
-       } else {
-               rmask = S_IRGRP;
-               wmask = S_IWGRP;
-               xmask = S_IXGRP;
-       }
+               aoid = acl_phys.z_acl_extern_obj;
 
-       if (origmask & ACE_READ_DATA) {
-               if (mode & rmask) {
-                       acepmask &= ~ACE_READ_DATA;
+               if (aclp->z_acl_bytes > ZFS_ACE_SPACE) {
+                       /*
+                        * If ACL was previously external and we are now
+                        * converting to new ACL format then release old
+                        * ACL object and create a new one.
+                        */
+                       if (aoid &&
+                           aclp->z_version != acl_phys.z_acl_version) {
+                               error = dmu_object_free(zfsvfs->z_os, aoid, tx);
+                               if (error)
+                                       return (error);
+                               aoid = 0;
+                       }
+                       if (aoid == 0) {
+                               aoid = dmu_object_alloc(zfsvfs->z_os,
+                                   otype, aclp->z_acl_bytes,
+                                   otype == DMU_OT_ACL ?
+                                   DMU_OT_SYSACL : DMU_OT_NONE,
+                                   otype == DMU_OT_ACL ?
+                                   DN_OLD_MAX_BONUSLEN : 0, tx);
+                       } else {
+                               (void) dmu_object_set_blocksize(zfsvfs->z_os,
+                                   aoid, aclp->z_acl_bytes, 0, tx);
+                       }
+                       acl_phys.z_acl_extern_obj = aoid;
+                       for (aclnode = list_head(&aclp->z_acl); aclnode;
+                           aclnode = list_next(&aclp->z_acl, aclnode)) {
+                               if (aclnode->z_ace_count == 0)
+                                       continue;
+                               dmu_write(zfsvfs->z_os, aoid, off,
+                                   aclnode->z_size, aclnode->z_acldata, tx);
+                               off += aclnode->z_size;
+                       }
                } else {
-                       acepmask |= ACE_READ_DATA;
-               }
-       }
+                       void *start = acl_phys.z_ace_data;
+                       /*
+                        * Migrating back embedded?
+                        */
+                       if (acl_phys.z_acl_extern_obj) {
+                               error = dmu_object_free(zfsvfs->z_os,
+                                   acl_phys.z_acl_extern_obj, tx);
+                               if (error)
+                                       return (error);
+                               acl_phys.z_acl_extern_obj = 0;
+                       }
 
-       if (origmask & ACE_WRITE_DATA) {
-               if (mode & wmask) {
-                       acepmask &= ~ACE_WRITE_DATA;
-               } else {
-                       acepmask |= ACE_WRITE_DATA;
+                       for (aclnode = list_head(&aclp->z_acl); aclnode;
+                           aclnode = list_next(&aclp->z_acl, aclnode)) {
+                               if (aclnode->z_ace_count == 0)
+                                       continue;
+                               bcopy(aclnode->z_acldata, start,
+                                   aclnode->z_size);
+                               start = (caddr_t)start + aclnode->z_size;
+                       }
                }
-       }
-
-       if (origmask & ACE_APPEND_DATA) {
-               if (mode & wmask) {
-                       acepmask &= ~ACE_APPEND_DATA;
+               /*
+                * If Old version then swap count/bytes to match old
+                * layout of znode_acl_phys_t.
+                */
+               if (aclp->z_version == ZFS_ACL_VERSION_INITIAL) {
+                       acl_phys.z_acl_size = aclp->z_acl_count;
+                       acl_phys.z_acl_count = aclp->z_acl_bytes;
                } else {
-                       acepmask |= ACE_APPEND_DATA;
+                       acl_phys.z_acl_size = aclp->z_acl_bytes;
+                       acl_phys.z_acl_count = aclp->z_acl_count;
                }
-       }
+               acl_phys.z_acl_version = aclp->z_version;
 
-       if (origmask & ACE_EXECUTE) {
-               if (mode & xmask) {
-                       acepmask &= ~ACE_EXECUTE;
-               } else {
-                       acepmask |= ACE_EXECUTE;
-               }
+               SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_ZNODE_ACL(zfsvfs), NULL,
+                   &acl_phys, sizeof (acl_phys));
        }
-       aclp->z_ops.ace_mask_set(acep, acepmask);
-}
-
-/*
- * Apply mode to canonical six ACEs.
- */
-static void
-zfs_acl_fixup_canonical_six(zfs_acl_t *aclp, mode_t mode)
-{
-       zfs_acl_node_t *aclnode = list_tail(&aclp->z_acl);
-       void    *acep;
-       int     maskoff = aclp->z_ops.ace_mask_off();
-       size_t abstract_size = aclp->z_ops.ace_abstract_size();
-
-       ASSERT(aclnode != NULL);
-
-       acep = (void *)((caddr_t)aclnode->z_acldata +
-           aclnode->z_size - (abstract_size * 6));
 
        /*
-        * Fixup final ACEs to match the mode
+        * Replace ACL wide bits, but first clear them.
         */
+       zp->z_pflags &= ~ZFS_ACL_WIDE_FLAGS;
 
-       adjust_ace_pair_common(acep, maskoff, abstract_size,
-           (mode & 0700) >> 6);        /* owner@ */
-
-       acep = (caddr_t)acep + (abstract_size * 2);
-
-       adjust_ace_pair_common(acep, maskoff, abstract_size,
-           (mode & 0070) >> 3);        /* group@ */
-
-       acep = (caddr_t)acep + (abstract_size * 2);
-       adjust_ace_pair_common(acep, maskoff,
-           abstract_size, mode);       /* everyone@ */
-}
-
-
-static int
-zfs_acl_ace_match(zfs_acl_t *aclp, void *acep, int allow_deny,
-    int entry_type, int accessmask)
-{
-       uint32_t mask = aclp->z_ops.ace_mask_get(acep);
-       uint16_t type = aclp->z_ops.ace_type_get(acep);
-       uint16_t flags = aclp->z_ops.ace_flags_get(acep);
-
-       return (mask == accessmask && type == allow_deny &&
-           ((flags & ACE_TYPE_FLAGS) == entry_type));
-}
-
-/*
- * Can prepended ACE be reused?
- */
-static int
-zfs_reuse_deny(zfs_acl_t *aclp, void *acep, void *prevacep)
-{
-       int okay_masks;
-       uint16_t prevtype;
-       uint16_t prevflags;
-       uint16_t flags;
-       uint32_t mask, prevmask;
-
-       if (prevacep == NULL)
-               return (B_FALSE);
-
-       prevtype = aclp->z_ops.ace_type_get(prevacep);
-       prevflags = aclp->z_ops.ace_flags_get(prevacep);
-       flags = aclp->z_ops.ace_flags_get(acep);
-       mask = aclp->z_ops.ace_mask_get(acep);
-       prevmask = aclp->z_ops.ace_mask_get(prevacep);
+       zp->z_pflags |= aclp->z_hints;
 
-       if (prevtype != DENY)
-               return (B_FALSE);
-
-       if (prevflags != (flags & ACE_IDENTIFIER_GROUP))
-               return (B_FALSE);
-
-       okay_masks = (mask & OKAY_MASK_BITS);
-
-       if (prevmask & ~okay_masks)
-               return (B_FALSE);
+       if (ace_trivial_common(aclp, 0, zfs_ace_walk) == 0)
+               zp->z_pflags |= ZFS_ACL_TRIVIAL;
 
-       return (B_TRUE);
+       zfs_tstamp_update_setup(zp, STATE_CHANGED, NULL, ctime);
+       return (sa_bulk_update(zp->z_sa_hdl, bulk, count, tx));
 }
 
-
-/*
- * Insert new ACL node into chain of zfs_acl_node_t's
- *
- * This will result in two possible results.
- * 1. If the ACL is currently just a single zfs_acl_node and
- *    we are prepending the entry then current acl node will have
- *    a new node inserted above it.
- *
- * 2. If we are inserting in the middle of current acl node then
- *    the current node will be split in two and new node will be inserted
- *    in between the two split nodes.
- */
-static zfs_acl_node_t *
-zfs_acl_ace_insert(zfs_acl_t *aclp, void  *acep)
+static void
+zfs_acl_chmod(zfsvfs_t *zfsvfs, uint64_t mode, zfs_acl_t *aclp)
 {
-       zfs_acl_node_t  *newnode;
-       zfs_acl_node_t  *trailernode = NULL;
-       zfs_acl_node_t  *currnode = zfs_acl_curr_node(aclp);
-       int             curr_idx = aclp->z_curr_node->z_ace_idx;
-       int             trailer_count;
-       size_t          oldsize;
+       void            *acep = NULL;
+       uint64_t        who;
+       int             new_count, new_bytes;
+       int             ace_size;
+       int             entry_type;
+       uint16_t        iflags, type;
+       uint32_t        access_mask;
+       zfs_acl_node_t  *newnode;
+       size_t          abstract_size = aclp->z_ops->ace_abstract_size();
+       void            *zacep;
+       uint32_t        owner, group, everyone;
+       uint32_t        deny1, deny2, allow0;
 
-       newnode = zfs_acl_node_alloc(aclp->z_ops.ace_size(acep));
-       newnode->z_ace_count = 1;
+       new_count = new_bytes = 0;
 
-       oldsize = currnode->z_size;
+       acl_trivial_access_masks((mode_t)mode, &allow0, &deny1, &deny2,
+           &owner, &group, &everyone);
 
-       if (curr_idx != 1) {
-               trailernode = zfs_acl_node_alloc(0);
-               trailernode->z_acldata = acep;
+       newnode = zfs_acl_node_alloc((abstract_size * 6) + aclp->z_acl_bytes);
 
-               trailer_count = currnode->z_ace_count - curr_idx + 1;
-               currnode->z_ace_count = curr_idx - 1;
-               currnode->z_size = (caddr_t)acep - (caddr_t)currnode->z_acldata;
-               trailernode->z_size = oldsize - currnode->z_size;
-               trailernode->z_ace_count = trailer_count;
+       zacep = newnode->z_acldata;
+       if (allow0) {
+               zfs_set_ace(aclp, zacep, allow0, ALLOW, -1, ACE_OWNER);
+               zacep = (void *)((uintptr_t)zacep + abstract_size);
+               new_count++;
+               new_bytes += abstract_size;
        }
-
-       aclp->z_acl_count += 1;
-       aclp->z_acl_bytes += aclp->z_ops.ace_size(acep);
-
-       if (curr_idx == 1)
-               list_insert_before(&aclp->z_acl, currnode, newnode);
-       else
-               list_insert_after(&aclp->z_acl, currnode, newnode);
-       if (trailernode) {
-               list_insert_after(&aclp->z_acl, newnode, trailernode);
-               aclp->z_curr_node = trailernode;
-               trailernode->z_ace_idx = 1;
+       if (deny1) {
+               zfs_set_ace(aclp, zacep, deny1, DENY, -1, ACE_OWNER);
+               zacep = (void *)((uintptr_t)zacep + abstract_size);
+               new_count++;
+               new_bytes += abstract_size;
        }
-
-       return (newnode);
-}
-
-/*
- * Prepend deny ACE
- */
-static void *
-zfs_acl_prepend_deny(uint64_t uid, zfs_acl_t *aclp, void *acep,
-    mode_t mode)
-{
-       zfs_acl_node_t *aclnode;
-       void  *newacep;
-       uint64_t fuid;
-       uint16_t flags;
-
-       aclnode = zfs_acl_ace_insert(aclp, acep);
-       newacep = aclnode->z_acldata;
-       fuid = aclp->z_ops.ace_who_get(acep);
-       flags = aclp->z_ops.ace_flags_get(acep);
-       zfs_set_ace(aclp, newacep, 0, DENY, fuid, (flags & ACE_TYPE_FLAGS));
-       zfs_acl_prepend_fixup(aclp, newacep, acep, mode, uid);
-
-       return (newacep);
-}
-
-/*
- * Split an inherited ACE into inherit_only ACE
- * and original ACE with inheritance flags stripped off.
- */
-static void
-zfs_acl_split_ace(zfs_acl_t *aclp, zfs_ace_hdr_t *acep)
-{
-       zfs_acl_node_t *aclnode;
-       zfs_acl_node_t *currnode;
-       void  *newacep;
-       uint16_t type, flags;
-       uint32_t mask;
-       uint64_t fuid;
-
-       type = aclp->z_ops.ace_type_get(acep);
-       flags = aclp->z_ops.ace_flags_get(acep);
-       mask = aclp->z_ops.ace_mask_get(acep);
-       fuid = aclp->z_ops.ace_who_get(acep);
-
-       aclnode = zfs_acl_ace_insert(aclp, acep);
-       newacep = aclnode->z_acldata;
-
-       aclp->z_ops.ace_type_set(newacep, type);
-       aclp->z_ops.ace_flags_set(newacep, flags | ACE_INHERIT_ONLY_ACE);
-       aclp->z_ops.ace_mask_set(newacep, mask);
-       aclp->z_ops.ace_type_set(newacep, type);
-       aclp->z_ops.ace_who_set(newacep, fuid);
-       aclp->z_next_ace = acep;
-       flags &= ~ALL_INHERIT;
-       aclp->z_ops.ace_flags_set(acep, flags);
-       currnode = zfs_acl_curr_node(aclp);
-       ASSERT(currnode->z_ace_idx >= 1);
-       currnode->z_ace_idx -= 1;
-}
-
-/*
- * Are ACES started at index i, the canonical six ACES?
- */
-static int
-zfs_have_canonical_six(zfs_acl_t *aclp)
-{
-       void *acep;
-       zfs_acl_node_t *aclnode = list_tail(&aclp->z_acl);
-       int             i = 0;
-       size_t abstract_size = aclp->z_ops.ace_abstract_size();
-
-       ASSERT(aclnode != NULL);
-
-       if (aclnode->z_ace_count < 6)
-               return (0);
-
-       acep = (void *)((caddr_t)aclnode->z_acldata +
-           aclnode->z_size - (aclp->z_ops.ace_abstract_size() * 6));
-
-       if ((zfs_acl_ace_match(aclp, (caddr_t)acep + (abstract_size * i++),
-           DENY, ACE_OWNER, 0) &&
-           zfs_acl_ace_match(aclp, (caddr_t)acep + (abstract_size * i++),
-           ALLOW, ACE_OWNER, OWNER_ALLOW_MASK) &&
-           zfs_acl_ace_match(aclp, (caddr_t)acep + (abstract_size * i++), DENY,
-           OWNING_GROUP, 0) && zfs_acl_ace_match(aclp, (caddr_t)acep +
-           (abstract_size * i++),
-           ALLOW, OWNING_GROUP, 0) &&
-           zfs_acl_ace_match(aclp, (caddr_t)acep + (abstract_size * i++),
-           DENY, ACE_EVERYONE, EVERYONE_DENY_MASK) &&
-           zfs_acl_ace_match(aclp, (caddr_t)acep + (abstract_size * i++),
-           ALLOW, ACE_EVERYONE, EVERYONE_ALLOW_MASK))) {
-               return (1);
-       } else {
-               return (0);
+       if (deny2) {
+               zfs_set_ace(aclp, zacep, deny2, DENY, -1, OWNING_GROUP);
+               zacep = (void *)((uintptr_t)zacep + abstract_size);
+               new_count++;
+               new_bytes += abstract_size;
        }
-}
 
+       while ((acep = zfs_acl_next_ace(aclp, acep, &who, &access_mask,
+           &iflags, &type))) {
+               uint16_t inherit_flags;
 
-/*
- * Apply step 1g, to group entries
- *
- * Need to deal with corner case where group may have
- * greater permissions than owner.  If so then limit
- * group permissions, based on what extra permissions
- * group has.
- */
-static void
-zfs_fixup_group_entries(zfs_acl_t *aclp, void *acep, void *prevacep,
-    mode_t mode)
-{
-       uint32_t prevmask = aclp->z_ops.ace_mask_get(prevacep);
-       uint32_t mask = aclp->z_ops.ace_mask_get(acep);
-       uint16_t prevflags = aclp->z_ops.ace_flags_get(prevacep);
-       mode_t extramode = (mode >> 3) & 07;
-       mode_t ownermode = (mode >> 6);
-
-       if (prevflags & ACE_IDENTIFIER_GROUP) {
-
-               extramode &= ~ownermode;
+               entry_type = (iflags & ACE_TYPE_FLAGS);
+               inherit_flags = (iflags & ALL_INHERIT);
 
-               if (extramode) {
-                       if (extramode & S_IROTH) {
-                               prevmask &= ~ACE_READ_DATA;
-                               mask &= ~ACE_READ_DATA;
-                       }
-                       if (extramode & S_IWOTH) {
-                               prevmask &= ~(ACE_WRITE_DATA|ACE_APPEND_DATA);
-                               mask &= ~(ACE_WRITE_DATA|ACE_APPEND_DATA);
-                       }
-                       if (extramode & S_IXOTH) {
-                               prevmask  &= ~ACE_EXECUTE;
-                               mask &= ~ACE_EXECUTE;
-                       }
+               if ((entry_type == ACE_OWNER || entry_type == ACE_EVERYONE ||
+                   (entry_type == OWNING_GROUP)) &&
+                   ((inherit_flags & ACE_INHERIT_ONLY_ACE) == 0)) {
+                       continue;
                }
-       }
-       aclp->z_ops.ace_mask_set(acep, mask);
-       aclp->z_ops.ace_mask_set(prevacep, prevmask);
-}
-
-/*
- * Apply the chmod algorithm as described
- * in PSARC/2002/240
- */
-static void
-zfs_acl_chmod(zfsvfs_t *zfsvfs, uint64_t uid,
-    uint64_t mode, zfs_acl_t *aclp)
-{
-       void            *acep = NULL, *prevacep = NULL;
-       uint64_t        who;
-       int             i;
-       int             entry_type;
-       int             reuse_deny;
-       int             need_canonical_six = 1;
-       uint16_t        iflags, type;
-       uint32_t        access_mask;
-
-       /*
-        * If discard then just discard all ACL nodes which
-        * represent the ACEs.
-        *
-        * New owner@/group@/everone@ ACEs will be added
-        * later.
-        */
-       if (zfsvfs->z_acl_mode == ZFS_ACL_DISCARD)
-               zfs_acl_release_nodes(aclp);
-
-       while (acep = zfs_acl_next_ace(aclp, acep, &who, &access_mask,
-           &iflags, &type)) {
-
-               entry_type = (iflags & ACE_TYPE_FLAGS);
-               iflags = (iflags & ALL_INHERIT);
 
                if ((type != ALLOW && type != DENY) ||
-                   (iflags & ACE_INHERIT_ONLY_ACE)) {
-                       if (iflags)
+                   (inherit_flags & ACE_INHERIT_ONLY_ACE)) {
+                       if (inherit_flags)
                                aclp->z_hints |= ZFS_INHERIT_ACE;
                        switch (type) {
                        case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE:
@@ -1542,116 +1530,58 @@ zfs_acl_chmod(zfsvfs_t *zfsvfs, uint64_t uid,
                                aclp->z_hints |= ZFS_ACL_OBJ_ACE;
                                break;
                        }
-                       goto nextace;
-               }
-
-               /*
-                * Need to split ace into two?
-                */
-               if ((iflags & (ACE_FILE_INHERIT_ACE|
-                   ACE_DIRECTORY_INHERIT_ACE)) &&
-                   (!(iflags & ACE_INHERIT_ONLY_ACE))) {
-                       zfs_acl_split_ace(aclp, acep);
-                       aclp->z_hints |= ZFS_INHERIT_ACE;
-                       goto nextace;
-               }
-
-               if (entry_type == ACE_OWNER || entry_type == ACE_EVERYONE ||
-                   (entry_type == OWNING_GROUP)) {
-                       access_mask &= ~OGE_CLEAR;
-                       aclp->z_ops.ace_mask_set(acep, access_mask);
-                       goto nextace;
                } else {
-                       reuse_deny = B_TRUE;
-                       if (type == ALLOW) {
-
-                               /*
-                                * Check preceding ACE if any, to see
-                                * if we need to prepend a DENY ACE.
-                                * This is only applicable when the acl_mode
-                                * property == groupmask.
-                                */
-                               if (zfsvfs->z_acl_mode == ZFS_ACL_GROUPMASK) {
-
-                                       reuse_deny = zfs_reuse_deny(aclp, acep,
-                                           prevacep);
-
-                                       if (!reuse_deny) {
-                                               prevacep =
-                                                   zfs_acl_prepend_deny(uid,
-                                                   aclp, acep, mode);
-                                       } else {
-                                               zfs_acl_prepend_fixup(
-                                                   aclp, prevacep,
-                                                   acep, mode, uid);
-                                       }
-                                       zfs_fixup_group_entries(aclp, acep,
-                                           prevacep, mode);
-                               }
-                       }
-               }
-nextace:
-               prevacep = acep;
-       }
-
-       /*
-        * Check out last six aces, if we have six.
-        */
 
-       if (aclp->z_acl_count >= 6) {
-               if (zfs_have_canonical_six(aclp)) {
-                       need_canonical_six = 0;
+                       /*
+                        * Limit permissions to be no greater than
+                        * group permissions
+                        */
+                       if (zfsvfs->z_acl_inherit == ZFS_ACL_RESTRICTED) {
+                               if (!(mode & S_IRGRP))
+                                       access_mask &= ~ACE_READ_DATA;
+                               if (!(mode & S_IWGRP))
+                                       access_mask &=
+                                           ~(ACE_WRITE_DATA|ACE_APPEND_DATA);
+                               if (!(mode & S_IXGRP))
+                                       access_mask &= ~ACE_EXECUTE;
+                               access_mask &=
+                                   ~(ACE_WRITE_OWNER|ACE_WRITE_ACL|
+                                   ACE_WRITE_ATTRIBUTES|ACE_WRITE_NAMED_ATTRS);
+                       }
                }
-       }
-
-       if (need_canonical_six) {
-               size_t abstract_size = aclp->z_ops.ace_abstract_size();
-               void *zacep;
-               zfs_acl_node_t *aclnode =
-                   zfs_acl_node_alloc(abstract_size * 6);
-
-               aclnode->z_size = abstract_size * 6;
-               aclnode->z_ace_count = 6;
-               aclp->z_acl_bytes += aclnode->z_size;
-               list_insert_tail(&aclp->z_acl, aclnode);
-
-               zacep = aclnode->z_acldata;
-
-               i = 0;
-               zfs_set_ace(aclp, (caddr_t)zacep + (abstract_size * i++),
-                   0, DENY, -1, ACE_OWNER);
-               zfs_set_ace(aclp, (caddr_t)zacep + (abstract_size * i++),
-                   OWNER_ALLOW_MASK, ALLOW, -1, ACE_OWNER);
-               zfs_set_ace(aclp, (caddr_t)zacep + (abstract_size * i++), 0,
-                   DENY, -1, OWNING_GROUP);
-               zfs_set_ace(aclp, (caddr_t)zacep + (abstract_size * i++), 0,
-                   ALLOW, -1, OWNING_GROUP);
-               zfs_set_ace(aclp, (caddr_t)zacep + (abstract_size * i++),
-                   EVERYONE_DENY_MASK, DENY, -1, ACE_EVERYONE);
-               zfs_set_ace(aclp, (caddr_t)zacep + (abstract_size * i++),
-                   EVERYONE_ALLOW_MASK, ALLOW, -1, ACE_EVERYONE);
-               aclp->z_acl_count += 6;
-       }
-
-       zfs_acl_fixup_canonical_six(aclp, mode);
+               zfs_set_ace(aclp, zacep, access_mask, type, who, iflags);
+               ace_size = aclp->z_ops->ace_size(acep);
+               zacep = (void *)((uintptr_t)zacep + ace_size);
+               new_count++;
+               new_bytes += ace_size;
+       }
+       zfs_set_ace(aclp, zacep, owner, 0, -1, ACE_OWNER);
+       zacep = (void *)((uintptr_t)zacep + abstract_size);
+       zfs_set_ace(aclp, zacep, group, 0, -1, OWNING_GROUP);
+       zacep = (void *)((uintptr_t)zacep + abstract_size);
+       zfs_set_ace(aclp, zacep, everyone, 0, -1, ACE_EVERYONE);
+
+       new_count += 3;
+       new_bytes += abstract_size * 3;
+       zfs_acl_release_nodes(aclp);
+       aclp->z_acl_count = new_count;
+       aclp->z_acl_bytes = new_bytes;
+       newnode->z_ace_count = new_count;
+       newnode->z_size = new_bytes;
+       list_insert_tail(&aclp->z_acl, newnode);
 }
 
-int
+void
 zfs_acl_chmod_setattr(znode_t *zp, zfs_acl_t **aclp, uint64_t mode)
 {
-       int error;
-
-       mutex_enter(&zp->z_lock);
        mutex_enter(&zp->z_acl_lock);
-       *aclp = NULL;
-       error = zfs_acl_node_read(zp, aclp, B_TRUE);
-       if (error == 0) {
-               (*aclp)->z_hints = zp->z_phys->zp_flags & V4_ACL_WIDE_FLAGS;
-               zfs_acl_chmod(zp->z_zfsvfs, zp->z_phys->zp_uid, mode, *aclp);
-       }
-       mutex_exit(&zp->z_acl_lock);
+       mutex_enter(&zp->z_lock);
+       *aclp = zfs_acl_alloc(zfs_acl_version_zp(zp));
+       (*aclp)->z_hints = zp->z_pflags & V4_ACL_WIDE_FLAGS;
+       zfs_acl_chmod(ZTOZSB(zp), mode, *aclp);
        mutex_exit(&zp->z_lock);
-       return (error);
+       mutex_exit(&zp->z_acl_lock);
+       ASSERT(*aclp);
 }
 
 /*
@@ -1660,12 +1590,12 @@ zfs_acl_chmod_setattr(znode_t *zp, zfs_acl_t **aclp, uint64_t mode)
 static void
 zfs_restricted_update(zfsvfs_t *zfsvfs, zfs_acl_t *aclp, void *acep)
 {
-       uint32_t mask = aclp->z_ops.ace_mask_get(acep);
+       uint32_t mask = aclp->z_ops->ace_mask_get(acep);
 
        if ((zfsvfs->z_acl_inherit == ZFS_ACL_RESTRICTED) &&
-           (aclp->z_ops.ace_type_get(acep) == ALLOW)) {
+           (aclp->z_ops->ace_type_get(acep) == ALLOW)) {
                mask &= ~RESTRICTED_CLEAR;
-               aclp->z_ops.ace_mask_set(acep, mask);
+               aclp->z_ops->ace_mask_set(acep, mask);
        }
 }
 
@@ -1673,14 +1603,14 @@ zfs_restricted_update(zfsvfs_t *zfsvfs, zfs_acl_t *aclp, void *acep)
  * Should ACE be inherited?
  */
 static int
-zfs_ace_can_use(vtype_t vtype, uint16_t acep_flags)
+zfs_ace_can_use(umode_t obj_mode, uint16_t acep_flags)
 {
        int     iflags = (acep_flags & 0xf);
 
-       if ((vtype == VDIR) && (iflags & ACE_DIRECTORY_INHERIT_ACE))
+       if (S_ISDIR(obj_mode) && (iflags & ACE_DIRECTORY_INHERIT_ACE))
                return (1);
        else if (iflags & ACE_FILE_INHERIT_ACE)
-               return (!((vtype == VDIR) &&
+               return (!(S_ISDIR(obj_mode) &&
                    (iflags & ACE_NO_PROPAGATE_INHERIT_ACE)));
        return (0);
 }
@@ -1689,12 +1619,12 @@ zfs_ace_can_use(vtype_t vtype, uint16_t acep_flags)
  * inherit inheritable ACEs from parent
  */
 static zfs_acl_t *
-zfs_acl_inherit(zfsvfs_t *zfsvfs, vtype_t vtype, zfs_acl_t *paclp,
+zfs_acl_inherit(zfsvfs_t *zfsvfs, umode_t obj_mode, zfs_acl_t *paclp,
     uint64_t mode, boolean_t *need_chmod)
 {
        void            *pacep;
-       void            *acep, *acep2;
-       zfs_acl_node_t  *aclnode, *aclnode2;
+       void            *acep;
+       zfs_acl_node_t  *aclnode;
        zfs_acl_t       *aclp = NULL;
        uint64_t        who;
        uint32_t        access_mask;
@@ -1702,8 +1632,8 @@ zfs_acl_inherit(zfsvfs_t *zfsvfs, vtype_t vtype, zfs_acl_t *paclp,
        size_t          ace_size;
        void            *data1, *data2;
        size_t          data1sz, data2sz;
-       boolean_t       vdir = vtype == VDIR;
-       boolean_t       vreg = vtype == VREG;
+       boolean_t       vdir = S_ISDIR(obj_mode);
+       boolean_t       vreg = S_ISREG(obj_mode);
        boolean_t       passthrough, passthrough_x, noallow;
 
        passthrough_x =
@@ -1716,10 +1646,10 @@ zfs_acl_inherit(zfsvfs_t *zfsvfs, vtype_t vtype, zfs_acl_t *paclp,
        *need_chmod = B_TRUE;
        pacep = NULL;
        aclp = zfs_acl_alloc(paclp->z_version);
-       if (zfsvfs->z_acl_inherit == ZFS_ACL_DISCARD)
+       if (zfsvfs->z_acl_inherit == ZFS_ACL_DISCARD || S_ISLNK(obj_mode))
                return (aclp);
-       while (pacep = zfs_acl_next_ace(paclp, pacep, &who,
-           &access_mask, &iflags, &type)) {
+       while ((pacep = zfs_acl_next_ace(paclp, pacep, &who,
+           &access_mask, &iflags, &type))) {
 
                /*
                 * don't inherit bogus ACEs
@@ -1730,9 +1660,9 @@ zfs_acl_inherit(zfsvfs_t *zfsvfs, vtype_t vtype, zfs_acl_t *paclp,
                if (noallow && type == ALLOW)
                        continue;
 
-               ace_size = aclp->z_ops.ace_size(pacep);
+               ace_size = aclp->z_ops->ace_size(pacep);
 
-               if (!zfs_ace_can_use(vtype, iflags))
+               if (!zfs_ace_can_use(obj_mode, iflags))
                        continue;
 
                /*
@@ -1745,11 +1675,11 @@ zfs_acl_inherit(zfsvfs_t *zfsvfs, vtype_t vtype, zfs_acl_t *paclp,
                    OWNING_GROUP)) && (vreg || (vdir && (iflags &
                    ACE_DIRECTORY_INHERIT_ACE)))) {
                        *need_chmod = B_FALSE;
+               }
 
-                       if (!vdir && passthrough_x &&
-                           ((mode & (S_IXUSR | S_IXGRP | S_IXOTH)) == 0)) {
-                               access_mask &= ~ACE_EXECUTE;
-                       }
+               if (!vdir && passthrough_x &&
+                   ((mode & (S_IXUSR | S_IXGRP | S_IXOTH)) == 0)) {
+                       access_mask &= ~ACE_EXECUTE;
                }
 
                aclnode = zfs_acl_node_alloc(ace_size);
@@ -1762,22 +1692,23 @@ zfs_acl_inherit(zfsvfs_t *zfsvfs, vtype_t vtype, zfs_acl_t *paclp,
                /*
                 * Copy special opaque data if any
                 */
-               if ((data1sz = paclp->z_ops.ace_data(pacep, &data1)) != 0) {
-                       VERIFY((data2sz = aclp->z_ops.ace_data(acep,
+               if ((data1sz = paclp->z_ops->ace_data(pacep, &data1)) != 0) {
+                       VERIFY((data2sz = aclp->z_ops->ace_data(acep,
                            &data2)) == data1sz);
                        bcopy(data1, data2, data2sz);
                }
+
                aclp->z_acl_count++;
                aclnode->z_ace_count++;
                aclp->z_acl_bytes += aclnode->z_size;
-               newflags = aclp->z_ops.ace_flags_get(acep);
+               newflags = aclp->z_ops->ace_flags_get(acep);
 
                if (vdir)
                        aclp->z_hints |= ZFS_INHERIT_ACE;
 
                if ((iflags & ACE_NO_PROPAGATE_INHERIT_ACE) || !vdir) {
                        newflags &= ~ALL_INHERIT;
-                       aclp->z_ops.ace_flags_set(acep,
+                       aclp->z_ops->ace_flags_set(acep,
                            newflags|ACE_INHERITED_ACE);
                        zfs_restricted_update(zfsvfs, aclp, acep);
                        continue;
@@ -1785,39 +1716,18 @@ zfs_acl_inherit(zfsvfs_t *zfsvfs, vtype_t vtype, zfs_acl_t *paclp,
 
                ASSERT(vdir);
 
-               newflags = aclp->z_ops.ace_flags_get(acep);
+               /*
+                * If only FILE_INHERIT is set then turn on
+                * inherit_only
+                */
                if ((iflags & (ACE_FILE_INHERIT_ACE |
-                   ACE_DIRECTORY_INHERIT_ACE)) !=
-                   ACE_FILE_INHERIT_ACE) {
-                       aclnode2 = zfs_acl_node_alloc(ace_size);
-                       list_insert_tail(&aclp->z_acl, aclnode2);
-                       acep2 = aclnode2->z_acldata;
-                       zfs_set_ace(aclp, acep2,
-                           access_mask, type, who,
-                           iflags|ACE_INHERITED_ACE);
+                   ACE_DIRECTORY_INHERIT_ACE)) == ACE_FILE_INHERIT_ACE) {
                        newflags |= ACE_INHERIT_ONLY_ACE;
-                       aclp->z_ops.ace_flags_set(acep, newflags);
-                       newflags &= ~ALL_INHERIT;
-                       aclp->z_ops.ace_flags_set(acep2,
+                       aclp->z_ops->ace_flags_set(acep,
                            newflags|ACE_INHERITED_ACE);
-
-                       /*
-                        * Copy special opaque data if any
-                        */
-                       if ((data1sz = aclp->z_ops.ace_data(acep,
-                           &data1)) != 0) {
-                               VERIFY((data2sz =
-                                   aclp->z_ops.ace_data(acep2,
-                                   &data2)) == data1sz);
-                               bcopy(data1, data2, data1sz);
-                       }
-                       aclp->z_acl_count++;
-                       aclnode2->z_ace_count++;
-                       aclp->z_acl_bytes += aclnode->z_size;
-                       zfs_restricted_update(zfsvfs, aclp, acep2);
                } else {
-                       newflags |= ACE_INHERIT_ONLY_ACE;
-                       aclp->z_ops.ace_flags_set(acep,
+                       newflags &= ~ACE_INHERIT_ONLY_ACE;
+                       aclp->z_ops->ace_flags_set(acep,
                            newflags|ACE_INHERITED_ACE);
                }
        }
@@ -1833,30 +1743,32 @@ zfs_acl_ids_create(znode_t *dzp, int flag, vattr_t *vap, cred_t *cr,
     vsecattr_t *vsecp, zfs_acl_ids_t *acl_ids)
 {
        int             error;
-       zfsvfs_t        *zfsvfs = dzp->z_zfsvfs;
+       zfsvfs_t        *zfsvfs = ZTOZSB(dzp);
        zfs_acl_t       *paclp;
-       gid_t           gid;
+       gid_t           gid = vap->va_gid;
        boolean_t       need_chmod = B_TRUE;
+       boolean_t       inherited = B_FALSE;
 
        bzero(acl_ids, sizeof (zfs_acl_ids_t));
-       acl_ids->z_mode = MAKEIMODE(vap->va_type, vap->va_mode);
+       acl_ids->z_mode = vap->va_mode;
 
        if (vsecp)
-               if ((error = zfs_vsec_2_aclp(zfsvfs, vap->va_type, vsecp, cr,
-                   &acl_ids->z_fuidp, &acl_ids->z_aclp)) != 0)
+               if ((error = zfs_vsec_2_aclp(zfsvfs, vap->va_mode, vsecp,
+                   cr, &acl_ids->z_fuidp, &acl_ids->z_aclp)) != 0)
                        return (error);
 
+       acl_ids->z_fuid = vap->va_uid;
+       acl_ids->z_fgid = vap->va_gid;
+#ifdef HAVE_KSID
        /*
         * Determine uid and gid.
         */
-       if ((flag & (IS_ROOT_NODE | IS_REPLAY)) ||
-           ((flag & IS_XATTR) && (vap->va_type == VDIR))) {
-               acl_ids->z_fuid = zfs_fuid_create(zfsvfs,
-                   (uint64_t)vap->va_uid, cr,
-                   ZFS_OWNER, &acl_ids->z_fuidp);
-               acl_ids->z_fgid = zfs_fuid_create(zfsvfs,
-                   (uint64_t)vap->va_gid, cr,
-                   ZFS_GROUP, &acl_ids->z_fuidp);
+       if ((flag & IS_ROOT_NODE) || zfsvfs->z_replay ||
+           ((flag & IS_XATTR) && (S_ISDIR(vap->va_mode)))) {
+               acl_ids->z_fuid = zfs_fuid_create(zfsvfs, (uint64_t)vap->va_uid,
+                   cr, ZFS_OWNER, &acl_ids->z_fuidp);
+               acl_ids->z_fgid = zfs_fuid_create(zfsvfs, (uint64_t)vap->va_gid,
+                   cr, ZFS_GROUP, &acl_ids->z_fuidp);
                gid = vap->va_gid;
        } else {
                acl_ids->z_fuid = zfs_fuid_create_cred(zfsvfs, ZFS_OWNER,
@@ -1867,16 +1779,32 @@ zfs_acl_ids_create(znode_t *dzp, int flag, vattr_t *vap, cred_t *cr,
                            (uint64_t)vap->va_gid,
                            cr, ZFS_GROUP, &acl_ids->z_fuidp);
                        gid = vap->va_gid;
-                       if (acl_ids->z_fgid != dzp->z_phys->zp_gid &&
+                       if (acl_ids->z_fgid != KGID_TO_SGID(ZTOI(dzp)->i_gid) &&
                            !groupmember(vap->va_gid, cr) &&
                            secpolicy_vnode_create_gid(cr) != 0)
                                acl_ids->z_fgid = 0;
                }
                if (acl_ids->z_fgid == 0) {
-                       if (dzp->z_phys->zp_mode & S_ISGID) {
-                               acl_ids->z_fgid = dzp->z_phys->zp_gid;
+                       if (dzp->z_mode & S_ISGID) {
+                               char            *domain;
+                               uint32_t        rid;
+
+                               acl_ids->z_fgid = KGID_TO_SGID(
+                                   ZTOI(dzp)->i_gid);
                                gid = zfs_fuid_map_id(zfsvfs, acl_ids->z_fgid,
                                    cr, ZFS_GROUP);
+
+                               if (zfsvfs->z_use_fuids &&
+                                   IS_EPHEMERAL(acl_ids->z_fgid)) {
+                                       domain = zfs_fuid_idx_domain(
+                                           &zfsvfs->z_fuid_idx,
+                                           FUID_INDEX(acl_ids->z_fgid));
+                                       rid = FUID_RID(acl_ids->z_fgid);
+                                       zfs_fuid_node_add(&acl_ids->z_fuidp,
+                                           domain, rid,
+                                           FUID_INDEX(acl_ids->z_fgid),
+                                           acl_ids->z_fgid, ZFS_GROUP);
+                               }
                        } else {
                                acl_ids->z_fgid = zfs_fuid_create_cred(zfsvfs,
                                    ZFS_GROUP, cr, &acl_ids->z_fuidp);
@@ -1884,6 +1812,7 @@ zfs_acl_ids_create(znode_t *dzp, int flag, vattr_t *vap, cred_t *cr,
                        }
                }
        }
+#endif /* HAVE_KSID */
 
        /*
         * If we're creating a directory, and the parent directory has the
@@ -1892,8 +1821,8 @@ zfs_acl_ids_create(znode_t *dzp, int flag, vattr_t *vap, cred_t *cr,
         * file's new group, clear the file's set-GID bit.
         */
 
-       if (!(flag & IS_ROOT_NODE) && (dzp->z_phys->zp_mode & S_ISGID) &&
-           (vap->va_type == VDIR)) {
+       if (!(flag & IS_ROOT_NODE) && (dzp->z_mode & S_ISGID) &&
+           (S_ISDIR(vap->va_mode))) {
                acl_ids->z_mode |= S_ISGID;
        } else {
                if ((acl_ids->z_mode & S_ISGID) &&
@@ -1902,28 +1831,38 @@ zfs_acl_ids_create(znode_t *dzp, int flag, vattr_t *vap, cred_t *cr,
        }
 
        if (acl_ids->z_aclp == NULL) {
+               mutex_enter(&dzp->z_acl_lock);
                mutex_enter(&dzp->z_lock);
-               if (!(flag & IS_ROOT_NODE) && (ZTOV(dzp)->v_type == VDIR &&
-                   (dzp->z_phys->zp_flags & ZFS_INHERIT_ACE)) &&
-                   !(dzp->z_phys->zp_flags & ZFS_XATTR)) {
-                       mutex_enter(&dzp->z_acl_lock);
-                       VERIFY(0 == zfs_acl_node_read(dzp, &paclp, B_FALSE));
-                       mutex_exit(&dzp->z_acl_lock);
+               if (!(flag & IS_ROOT_NODE) && (S_ISDIR(ZTOI(dzp)->i_mode) &&
+                   (dzp->z_pflags & ZFS_INHERIT_ACE)) &&
+                   !(dzp->z_pflags & ZFS_XATTR)) {
+                       VERIFY(0 == zfs_acl_node_read(dzp, B_TRUE,
+                           &paclp, B_FALSE));
                        acl_ids->z_aclp = zfs_acl_inherit(zfsvfs,
-                           vap->va_type, paclp, acl_ids->z_mode, &need_chmod);
+                           vap->va_mode, paclp, acl_ids->z_mode, &need_chmod);
+                       inherited = B_TRUE;
                } else {
                        acl_ids->z_aclp =
                            zfs_acl_alloc(zfs_acl_version_zp(dzp));
+                       acl_ids->z_aclp->z_hints |= ZFS_ACL_TRIVIAL;
                }
                mutex_exit(&dzp->z_lock);
+               mutex_exit(&dzp->z_acl_lock);
                if (need_chmod) {
-                       acl_ids->z_aclp->z_hints = (vap->va_type == VDIR) ?
+                       acl_ids->z_aclp->z_hints |= S_ISDIR(vap->va_mode) ?
                            ZFS_ACL_AUTO_INHERIT : 0;
-                       zfs_acl_chmod(zfsvfs, acl_ids->z_fuid,
-                           acl_ids->z_mode, acl_ids->z_aclp);
+                       zfs_acl_chmod(zfsvfs, acl_ids->z_mode, acl_ids->z_aclp);
                }
        }
 
+       if (inherited || vsecp) {
+               acl_ids->z_mode = zfs_mode_compute(acl_ids->z_mode,
+                   acl_ids->z_aclp, &acl_ids->z_aclp->z_hints,
+                   acl_ids->z_fuid, acl_ids->z_fgid);
+               if (ace_trivial_common(acl_ids->z_aclp, 0, zfs_ace_walk) == 0)
+                       acl_ids->z_aclp->z_hints |= ZFS_ACL_TRIVIAL;
+       }
+
        return (0);
 }
 
@@ -1942,14 +1881,16 @@ zfs_acl_ids_free(zfs_acl_ids_t *acl_ids)
 }
 
 boolean_t
-zfs_acl_ids_overquota(zfsvfs_t *zfsvfs, zfs_acl_ids_t *acl_ids)
+zfs_acl_ids_overquota(zfsvfs_t *zv, zfs_acl_ids_t *acl_ids, uint64_t projid)
 {
-       return (zfs_usergroup_overquota(zfsvfs, B_FALSE, acl_ids->z_fuid) ||
-           zfs_usergroup_overquota(zfsvfs, B_TRUE, acl_ids->z_fgid));
+       return (zfs_id_overquota(zv, DMU_USERUSED_OBJECT, acl_ids->z_fuid) ||
+           zfs_id_overquota(zv, DMU_GROUPUSED_OBJECT, acl_ids->z_fgid) ||
+           (projid != ZFS_DEFAULT_PROJID && projid != ZFS_INVALID_PROJID &&
+           zfs_id_overquota(zv, DMU_PROJECTUSED_OBJECT, projid)));
 }
 
 /*
- * Retrieve a files ACL
+ * Retrieve a file's ACL
  */
 int
 zfs_getacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
@@ -1963,15 +1904,15 @@ zfs_getacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
        mask = vsecp->vsa_mask & (VSA_ACE | VSA_ACECNT |
            VSA_ACE_ACLFLAGS | VSA_ACE_ALLTYPES);
 
-       if (error = zfs_zaccess(zp, ACE_READ_ACL, 0, skipaclchk, cr))
-               return (error);
-
        if (mask == 0)
-               return (ENOSYS);
+               return (SET_ERROR(ENOSYS));
+
+       if ((error = zfs_zaccess(zp, ACE_READ_ACL, 0, skipaclchk, cr)))
+               return (error);
 
        mutex_enter(&zp->z_acl_lock);
 
-       error = zfs_acl_node_read(zp, &aclp, B_FALSE);
+       error = zfs_acl_node_read(zp, B_FALSE, &aclp, B_FALSE);
        if (error != 0) {
                mutex_exit(&zp->z_acl_lock);
                return (error);
@@ -1980,15 +1921,14 @@ zfs_getacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
        /*
         * Scan ACL to determine number of ACEs
         */
-       if ((zp->z_phys->zp_flags & ZFS_ACL_OBJ_ACE) &&
-           !(mask & VSA_ACE_ALLTYPES)) {
+       if ((zp->z_pflags & ZFS_ACL_OBJ_ACE) && !(mask & VSA_ACE_ALLTYPES)) {
                void *zacep = NULL;
                uint64_t who;
                uint32_t access_mask;
                uint16_t type, iflags;
 
-               while (zacep = zfs_acl_next_ace(aclp, zacep,
-                   &who, &access_mask, &iflags, &type)) {
+               while ((zacep = zfs_acl_next_ace(aclp, zacep,
+                   &who, &access_mask, &iflags, &type))) {
                        switch (type) {
                        case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE:
                        case ACE_ACCESS_DENIED_OBJECT_ACE_TYPE:
@@ -2002,7 +1942,7 @@ zfs_getacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
                }
                vsecp->vsa_aclcnt = count;
        } else
-               count = aclp->z_acl_count;
+               count = (int)aclp->z_acl_count;
 
        if (mask & VSA_ACECNT) {
                vsecp->vsa_aclcnt = count;
@@ -2011,8 +1951,6 @@ zfs_getacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
        if (mask & VSA_ACE) {
                size_t aclsz;
 
-               zfs_acl_node_t *aclnode = list_head(&aclp->z_acl);
-
                aclsz = count * sizeof (ace_t) +
                    sizeof (ace_object_t) * largeace;
 
@@ -2020,20 +1958,29 @@ zfs_getacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
                vsecp->vsa_aclentsz = aclsz;
 
                if (aclp->z_version == ZFS_ACL_VERSION_FUID)
-                       zfs_copy_fuid_2_ace(zp->z_zfsvfs, aclp, cr,
+                       zfs_copy_fuid_2_ace(ZTOZSB(zp), aclp, cr,
                            vsecp->vsa_aclentp, !(mask & VSA_ACE_ALLTYPES));
                else {
-                       bcopy(aclnode->z_acldata, vsecp->vsa_aclentp,
-                           count * sizeof (ace_t));
+                       zfs_acl_node_t *aclnode;
+                       void *start = vsecp->vsa_aclentp;
+
+                       for (aclnode = list_head(&aclp->z_acl); aclnode;
+                           aclnode = list_next(&aclp->z_acl, aclnode)) {
+                               bcopy(aclnode->z_acldata, start,
+                                   aclnode->z_size);
+                               start = (caddr_t)start + aclnode->z_size;
+                       }
+                       ASSERT((caddr_t)start - (caddr_t)vsecp->vsa_aclentp ==
+                           aclp->z_acl_bytes);
                }
        }
        if (mask & VSA_ACE_ACLFLAGS) {
                vsecp->vsa_aclflags = 0;
-               if (zp->z_phys->zp_flags & ZFS_ACL_DEFAULTED)
+               if (zp->z_pflags & ZFS_ACL_DEFAULTED)
                        vsecp->vsa_aclflags |= ACL_DEFAULTED;
-               if (zp->z_phys->zp_flags & ZFS_ACL_PROTECTED)
+               if (zp->z_pflags & ZFS_ACL_PROTECTED)
                        vsecp->vsa_aclflags |= ACL_PROTECTED;
-               if (zp->z_phys->zp_flags & ZFS_ACL_AUTO_INHERIT)
+               if (zp->z_pflags & ZFS_ACL_AUTO_INHERIT)
                        vsecp->vsa_aclflags |= ACL_AUTO_INHERIT;
        }
 
@@ -2043,7 +1990,7 @@ zfs_getacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
 }
 
 int
-zfs_vsec_2_aclp(zfsvfs_t *zfsvfs, vtype_t obj_type,
+zfs_vsec_2_aclp(zfsvfs_t *zfsvfs, umode_t obj_mode,
     vsecattr_t *vsecp, cred_t *cr, zfs_fuid_info_t **fuidp, zfs_acl_t **zaclp)
 {
        zfs_acl_t *aclp;
@@ -2052,14 +1999,14 @@ zfs_vsec_2_aclp(zfsvfs_t *zfsvfs, vtype_t obj_type,
        int error;
 
        if (vsecp->vsa_aclcnt > MAX_ACL_ENTRIES || vsecp->vsa_aclcnt <= 0)
-               return (EINVAL);
+               return (SET_ERROR(EINVAL));
 
        aclp = zfs_acl_alloc(zfs_acl_version(zfsvfs->z_version));
 
        aclp->z_hints = 0;
        aclnode = zfs_acl_node_alloc(aclcnt * sizeof (zfs_object_ace_t));
        if (aclp->z_version == ZFS_ACL_VERSION_INITIAL) {
-               if ((error = zfs_copy_ace_2_oldace(obj_type, aclp,
+               if ((error = zfs_copy_ace_2_oldace(obj_mode, aclp,
                    (ace_t *)vsecp->vsa_aclentp, aclnode->z_acldata,
                    aclcnt, &aclnode->z_size)) != 0) {
                        zfs_acl_free(aclp);
@@ -2067,7 +2014,7 @@ zfs_vsec_2_aclp(zfsvfs_t *zfsvfs, vtype_t obj_type,
                        return (error);
                }
        } else {
-               if ((error = zfs_copy_ace_2_fuid(zfsvfs, obj_type, aclp,
+               if ((error = zfs_copy_ace_2_fuid(zfsvfs, obj_mode, aclp,
                    vsecp->vsa_aclentp, aclnode->z_acldata, aclcnt,
                    &aclnode->z_size, fuidp, cr)) != 0) {
                        zfs_acl_free(aclp);
@@ -2098,12 +2045,12 @@ zfs_vsec_2_aclp(zfsvfs_t *zfsvfs, vtype_t obj_type,
 }
 
 /*
- * Set a files ACL
+ * Set a file's ACL
  */
 int
 zfs_setacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
 {
-       zfsvfs_t        *zfsvfs = zp->z_zfsvfs;
+       zfsvfs_t        *zfsvfs = ZTOZSB(zp);
        zilog_t         *zilog = zfsvfs->z_log;
        ulong_t         mask = vsecp->vsa_mask & (VSA_ACE | VSA_ACECNT);
        dmu_tx_t        *tx;
@@ -2111,17 +2058,18 @@ zfs_setacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
        zfs_acl_t       *aclp;
        zfs_fuid_info_t *fuidp = NULL;
        boolean_t       fuid_dirtied;
+       uint64_t        acl_obj;
 
        if (mask == 0)
-               return (ENOSYS);
+               return (SET_ERROR(ENOSYS));
 
-       if (zp->z_phys->zp_flags & ZFS_IMMUTABLE)
-               return (EPERM);
+       if (zp->z_pflags & ZFS_IMMUTABLE)
+               return (SET_ERROR(EPERM));
 
-       if (error = zfs_zaccess(zp, ACE_WRITE_ACL, 0, skipaclchk, cr))
+       if ((error = zfs_zaccess(zp, ACE_WRITE_ACL, 0, skipaclchk, cr)))
                return (error);
 
-       error = zfs_vsec_2_aclp(zfsvfs, ZTOV(zp)->v_type, vsecp, cr, &fuidp,
+       error = zfs_vsec_2_aclp(zfsvfs, ZTOI(zp)->i_mode, vsecp, cr, &fuidp,
            &aclp);
        if (error)
                return (error);
@@ -2131,37 +2079,41 @@ zfs_setacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr)
         * existing flags.
         */
        if (!(vsecp->vsa_mask & VSA_ACE_ACLFLAGS)) {
-               aclp->z_hints |= (zp->z_phys->zp_flags & V4_ACL_WIDE_FLAGS);
+               aclp->z_hints |=
+                   (zp->z_pflags & V4_ACL_WIDE_FLAGS);
        }
 top:
-       mutex_enter(&zp->z_lock);
        mutex_enter(&zp->z_acl_lock);
+       mutex_enter(&zp->z_lock);
 
        tx = dmu_tx_create(zfsvfs->z_os);
-       dmu_tx_hold_bonus(tx, zp->z_id);
-
-       if (zp->z_phys->zp_acl.z_acl_extern_obj) {
-               /* Are we upgrading ACL? */
-               if (zfsvfs->z_version <= ZPL_VERSION_FUID &&
-                   zp->z_phys->zp_acl.z_acl_version ==
-                   ZFS_ACL_VERSION_INITIAL) {
-                       dmu_tx_hold_free(tx,
-                           zp->z_phys->zp_acl.z_acl_extern_obj,
-                           0, DMU_OBJECT_END);
-                       dmu_tx_hold_write(tx, DMU_NEW_OBJECT,
-                           0, aclp->z_acl_bytes);
+
+       dmu_tx_hold_sa(tx, zp->z_sa_hdl, B_TRUE);
+
+       fuid_dirtied = zfsvfs->z_fuid_dirty;
+       if (fuid_dirtied)
+               zfs_fuid_txhold(zfsvfs, tx);
+
+       /*
+        * If old version and ACL won't fit in bonus and we aren't
+        * upgrading then take out necessary DMU holds
+        */
+
+       if ((acl_obj = zfs_external_acl(zp)) != 0) {
+               if (zfsvfs->z_version >= ZPL_VERSION_FUID &&
+                   zfs_znode_acl_version(zp) <= ZFS_ACL_VERSION_INITIAL) {
+                       dmu_tx_hold_free(tx, acl_obj, 0,
+                           DMU_OBJECT_END);
+                       dmu_tx_hold_write(tx, DMU_NEW_OBJECT, 0,
+                           aclp->z_acl_bytes);
                } else {
-                       dmu_tx_hold_write(tx,
-                           zp->z_phys->zp_acl.z_acl_extern_obj,
-                           0, aclp->z_acl_bytes);
+                       dmu_tx_hold_write(tx, acl_obj, 0, aclp->z_acl_bytes);
                }
-       } else if (aclp->z_acl_bytes > ZFS_ACE_SPACE) {
+       } else if (!zp->z_is_sa && aclp->z_acl_bytes > ZFS_ACE_SPACE) {
                dmu_tx_hold_write(tx, DMU_NEW_OBJECT, 0, aclp->z_acl_bytes);
        }
-       fuid_dirtied = zfsvfs->z_fuid_dirty;
-       if (fuid_dirtied)
-               zfs_fuid_txhold(zfsvfs, tx);
 
+       zfs_sa_upgrade_txholds(tx, zp);
        error = dmu_tx_assign(tx, TXG_NOWAIT);
        if (error) {
                mutex_exit(&zp->z_acl_lock);
@@ -2179,20 +2131,20 @@ top:
 
        error = zfs_aclset_common(zp, aclp, cr, tx);
        ASSERT(error == 0);
+       ASSERT(zp->z_acl_cached == NULL);
        zp->z_acl_cached = aclp;
 
        if (fuid_dirtied)
                zfs_fuid_sync(zfsvfs, tx);
 
-       zfs_time_stamper_locked(zp, STATE_CHANGED, tx);
        zfs_log_acl(zilog, tx, zp, vsecp, fuidp);
 
        if (fuidp)
                zfs_fuid_info_free(fuidp);
        dmu_tx_commit(tx);
-done:
-       mutex_exit(&zp->z_acl_lock);
+
        mutex_exit(&zp->z_lock);
+       mutex_exit(&zp->z_acl_lock);
 
        return (error);
 }
@@ -2205,32 +2157,31 @@ done:
 static int
 zfs_zaccess_dataset_check(znode_t *zp, uint32_t v4_mode)
 {
-       if ((v4_mode & WRITE_MASK) &&
-           (zp->z_zfsvfs->z_vfs->vfs_flag & VFS_RDONLY) &&
-           (!IS_DEVVP(ZTOV(zp)) ||
-           (IS_DEVVP(ZTOV(zp)) && (v4_mode & WRITE_MASK_ATTRS)))) {
-               return (EROFS);
+       if ((v4_mode & WRITE_MASK) && (zfs_is_readonly(ZTOZSB(zp))) &&
+           (!S_ISDEV(ZTOI(zp)->i_mode) ||
+           (S_ISDEV(ZTOI(zp)->i_mode) && (v4_mode & WRITE_MASK_ATTRS)))) {
+               return (SET_ERROR(EROFS));
        }
 
        /*
         * Only check for READONLY on non-directories.
         */
        if ((v4_mode & WRITE_MASK_DATA) &&
-           (((ZTOV(zp)->v_type != VDIR) &&
-           (zp->z_phys->zp_flags & (ZFS_READONLY | ZFS_IMMUTABLE))) ||
-           (ZTOV(zp)->v_type == VDIR &&
-           (zp->z_phys->zp_flags & ZFS_IMMUTABLE)))) {
-               return (EPERM);
+           ((!S_ISDIR(ZTOI(zp)->i_mode) &&
+           (zp->z_pflags & (ZFS_READONLY | ZFS_IMMUTABLE))) ||
+           (S_ISDIR(ZTOI(zp)->i_mode) &&
+           (zp->z_pflags & ZFS_IMMUTABLE)))) {
+               return (SET_ERROR(EPERM));
        }
 
        if ((v4_mode & (ACE_DELETE | ACE_DELETE_CHILD)) &&
-           (zp->z_phys->zp_flags & ZFS_NOUNLINK)) {
-               return (EPERM);
+           (zp->z_pflags & ZFS_NOUNLINK)) {
+               return (SET_ERROR(EPERM));
        }
 
        if (((v4_mode & (ACE_READ_DATA|ACE_EXECUTE)) &&
-           (zp->z_phys->zp_flags & ZFS_AV_QUARANTINED))) {
-               return (EACCES);
+           (zp->z_pflags & ZFS_AV_QUARANTINED))) {
+               return (SET_ERROR(EACCES));
        }
 
        return (0);
@@ -2251,7 +2202,7 @@ zfs_zaccess_dataset_check(znode_t *zp, uint32_t v4_mode)
  * placed into the working_mode, giving the caller a mask of denied
  * accesses.  Returns:
  *     0               if all AoI granted
- *     EACCESS         if the denied mask is non-zero
+ *     EACCES          if the denied mask is non-zero
  *     other error     if abnormal failure (e.g., IO error)
  *
  * A secondary usage of the function is to determine if any of the
@@ -2265,38 +2216,41 @@ static int
 zfs_zaccess_aces_check(znode_t *zp, uint32_t *working_mode,
     boolean_t anyaccess, cred_t *cr)
 {
-       zfsvfs_t        *zfsvfs = zp->z_zfsvfs;
+       zfsvfs_t        *zfsvfs = ZTOZSB(zp);
        zfs_acl_t       *aclp;
        int             error;
        uid_t           uid = crgetuid(cr);
-       uint64_t        who;
+       uint64_t        who;
        uint16_t        type, iflags;
        uint16_t        entry_type;
        uint32_t        access_mask;
        uint32_t        deny_mask = 0;
        zfs_ace_hdr_t   *acep = NULL;
        boolean_t       checkit;
-       uid_t           fowner;
        uid_t           gowner;
+       uid_t           fowner;
 
        zfs_fuid_map_ids(zp, cr, &fowner, &gowner);
 
        mutex_enter(&zp->z_acl_lock);
 
-       error = zfs_acl_node_read(zp, &aclp, B_FALSE);
+       error = zfs_acl_node_read(zp, B_FALSE, &aclp, B_FALSE);
        if (error != 0) {
                mutex_exit(&zp->z_acl_lock);
                return (error);
        }
 
-       while (acep = zfs_acl_next_ace(aclp, acep, &who, &access_mask,
-           &iflags, &type)) {
+       ASSERT(zp->z_acl_cached);
+
+       while ((acep = zfs_acl_next_ace(aclp, acep, &who, &access_mask,
+           &iflags, &type))) {
                uint32_t mask_matched;
 
                if (!zfs_acl_valid_ace_type(type, iflags))
                        continue;
 
-               if (ZTOV(zp)->v_type == VDIR && (iflags & ACE_INHERIT_ONLY_ACE))
+               if (S_ISDIR(ZTOI(zp)->i_mode) &&
+                   (iflags & ACE_INHERIT_ONLY_ACE))
                        continue;
 
                /* Skip ACE if it does not affect any AoI */
@@ -2336,7 +2290,7 @@ zfs_zaccess_aces_check(znode_t *zp, uint32_t *working_mode,
                                break;
                        } else {
                                mutex_exit(&zp->z_acl_lock);
-                               return (EIO);
+                               return (SET_ERROR(EIO));
                        }
                }
 
@@ -2370,7 +2324,7 @@ zfs_zaccess_aces_check(znode_t *zp, uint32_t *working_mode,
        /* Put the found 'denies' back on the working mode */
        if (deny_mask) {
                *working_mode |= deny_mask;
-               return (EACCES);
+               return (SET_ERROR(EACCES));
        } else if (*working_mode) {
                return (-1);
        }
@@ -2388,18 +2342,11 @@ zfs_has_access(znode_t *zp, cred_t *cr)
        uint32_t have = ACE_ALL_PERMS;
 
        if (zfs_zaccess_aces_check(zp, &have, B_TRUE, cr) != 0) {
-               uid_t           owner;
+               uid_t owner;
 
-               owner = zfs_fuid_map_id(zp->z_zfsvfs,
-                   zp->z_phys->zp_uid, cr, ZFS_OWNER);
-
-               return (
-                   secpolicy_vnode_access(cr, ZTOV(zp), owner, VREAD) == 0 ||
-                   secpolicy_vnode_access(cr, ZTOV(zp), owner, VWRITE) == 0 ||
-                   secpolicy_vnode_access(cr, ZTOV(zp), owner, VEXEC) == 0 ||
-                   secpolicy_vnode_chown(cr, owner) == 0 ||
-                   secpolicy_vnode_setdac(cr, owner) == 0 ||
-                   secpolicy_vnode_remove(cr) == 0);
+               owner = zfs_fuid_map_id(ZTOZSB(zp),
+                   KUID_TO_SUID(ZTOI(zp)->i_uid), cr, ZFS_OWNER);
+               return (secpolicy_vnode_any_access(cr, ZTOI(zp), owner) == 0);
        }
        return (B_TRUE);
 }
@@ -2408,7 +2355,7 @@ static int
 zfs_zaccess_common(znode_t *zp, uint32_t v4_mode, uint32_t *working_mode,
     boolean_t *check_privs, boolean_t skipaclchk, cred_t *cr)
 {
-       zfsvfs_t *zfsvfs = zp->z_zfsvfs;
+       zfsvfs_t *zfsvfs = ZTOZSB(zp);
        int err;
 
        *working_mode = v4_mode;
@@ -2445,7 +2392,7 @@ zfs_zaccess_append(znode_t *zp, uint32_t *working_mode, boolean_t *check_privs,
     cred_t *cr)
 {
        if (*working_mode != ACE_WRITE_DATA)
-               return (EACCES);
+               return (SET_ERROR(EACCES));
 
        return (zfs_zaccess_common(zp, ACE_APPEND_DATA, working_mode,
            check_privs, B_FALSE, cr));
@@ -2457,38 +2404,34 @@ zfs_fastaccesschk_execute(znode_t *zdp, cred_t *cr)
        boolean_t owner = B_FALSE;
        boolean_t groupmbr = B_FALSE;
        boolean_t is_attr;
-       uid_t fowner;
-       uid_t gowner;
        uid_t uid = crgetuid(cr);
        int error;
 
-       if (zdp->z_phys->zp_flags & ZFS_AV_QUARANTINED)
-               return (EACCES);
+       if (zdp->z_pflags & ZFS_AV_QUARANTINED)
+               return (SET_ERROR(EACCES));
 
-       is_attr = ((zdp->z_phys->zp_flags & ZFS_XATTR) &&
-           (ZTOV(zdp)->v_type == VDIR));
+       is_attr = ((zdp->z_pflags & ZFS_XATTR) &&
+           (S_ISDIR(ZTOI(zdp)->i_mode)));
        if (is_attr)
                goto slow;
 
+
        mutex_enter(&zdp->z_acl_lock);
 
-       if (zdp->z_phys->zp_flags & ZFS_NO_EXECS_DENIED) {
+       if (zdp->z_pflags & ZFS_NO_EXECS_DENIED) {
                mutex_exit(&zdp->z_acl_lock);
                return (0);
        }
 
-       if (FUID_INDEX(zdp->z_phys->zp_uid) != 0 ||
-           FUID_INDEX(zdp->z_phys->zp_gid) != 0) {
+       if (KUID_TO_SUID(ZTOI(zdp)->i_uid) != 0 ||
+           KGID_TO_SGID(ZTOI(zdp)->i_gid) != 0) {
                mutex_exit(&zdp->z_acl_lock);
                goto slow;
        }
 
-       fowner = (uid_t)zdp->z_phys->zp_uid;
-       gowner = (uid_t)zdp->z_phys->zp_gid;
-
-       if (uid == fowner) {
+       if (uid == KUID_TO_SUID(ZTOI(zdp)->i_uid)) {
                owner = B_TRUE;
-               if (zdp->z_phys->zp_mode & S_IXUSR) {
+               if (zdp->z_mode & S_IXUSR) {
                        mutex_exit(&zdp->z_acl_lock);
                        return (0);
                } else {
@@ -2496,9 +2439,9 @@ zfs_fastaccesschk_execute(znode_t *zdp, cred_t *cr)
                        goto slow;
                }
        }
-       if (groupmember(gowner, cr)) {
+       if (groupmember(KGID_TO_SGID(ZTOI(zdp)->i_gid), cr)) {
                groupmbr = B_TRUE;
-               if (zdp->z_phys->zp_mode & S_IXGRP) {
+               if (zdp->z_mode & S_IXGRP) {
                        mutex_exit(&zdp->z_acl_lock);
                        return (0);
                } else {
@@ -2507,7 +2450,7 @@ zfs_fastaccesschk_execute(znode_t *zdp, cred_t *cr)
                }
        }
        if (!owner && !groupmbr) {
-               if (zdp->z_phys->zp_mode & S_IXOTH) {
+               if (zdp->z_mode & S_IXOTH) {
                        mutex_exit(&zdp->z_acl_lock);
                        return (0);
                }
@@ -2517,15 +2460,17 @@ zfs_fastaccesschk_execute(znode_t *zdp, cred_t *cr)
 
 slow:
        DTRACE_PROBE(zfs__fastpath__execute__access__miss);
-       ZFS_ENTER(zdp->z_zfsvfs);
+       ZFS_ENTER(ZTOZSB(zdp));
        error = zfs_zaccess(zdp, ACE_EXECUTE, 0, B_FALSE, cr);
-       ZFS_EXIT(zdp->z_zfsvfs);
+       ZFS_EXIT(ZTOZSB(zdp));
        return (error);
 }
 
 /*
- * Determine whether Access should be granted/denied, invoking least
- * priv subsytem when a deny is determined.
+ * Determine whether Access should be granted/denied.
+ *
+ * The least priv subsystem is always consulted as a basic privilege
+ * can define any form of access.
  */
 int
 zfs_zaccess(znode_t *zp, int mode, int flags, boolean_t skipaclchk, cred_t *cr)
@@ -2533,20 +2478,20 @@ zfs_zaccess(znode_t *zp, int mode, int flags, boolean_t skipaclchk, cred_t *cr)
        uint32_t        working_mode;
        int             error;
        int             is_attr;
-       zfsvfs_t        *zfsvfs = zp->z_zfsvfs;
        boolean_t       check_privs;
        znode_t         *xzp;
        znode_t         *check_zp = zp;
+       mode_t          needed_bits;
+       uid_t           owner;
 
-       is_attr = ((zp->z_phys->zp_flags & ZFS_XATTR) &&
-           (ZTOV(zp)->v_type == VDIR));
+       is_attr = ((zp->z_pflags & ZFS_XATTR) && S_ISDIR(ZTOI(zp)->i_mode));
 
        /*
         * If attribute then validate against base file
         */
        if (is_attr) {
-               if ((error = zfs_zget(zp->z_zfsvfs,
-                   zp->z_phys->zp_parent, &xzp)) != 0) {
+               if ((error = zfs_zget(ZTOZSB(zp),
+                   zp->z_xattr_parent, &xzp)) != 0) {
                        return (error);
                }
 
@@ -2567,16 +2512,42 @@ zfs_zaccess(znode_t *zp, int mode, int flags, boolean_t skipaclchk, cred_t *cr)
                }
        }
 
+       owner = zfs_fuid_map_id(ZTOZSB(zp), KUID_TO_SUID(ZTOI(zp)->i_uid),
+           cr, ZFS_OWNER);
+       /*
+        * Map the bits required to the standard inode flags
+        * S_IRUSR|S_IWUSR|S_IXUSR in the needed_bits.  Map the bits
+        * mapped by working_mode (currently missing) in missing_bits.
+        * Call secpolicy_vnode_access2() with (needed_bits & ~checkmode),
+        * needed_bits.
+        */
+       needed_bits = 0;
+
+       working_mode = mode;
+       if ((working_mode & (ACE_READ_ACL|ACE_READ_ATTRIBUTES)) &&
+           owner == crgetuid(cr))
+               working_mode &= ~(ACE_READ_ACL|ACE_READ_ATTRIBUTES);
+
+       if (working_mode & (ACE_READ_DATA|ACE_READ_NAMED_ATTRS|
+           ACE_READ_ACL|ACE_READ_ATTRIBUTES|ACE_SYNCHRONIZE))
+               needed_bits |= S_IRUSR;
+       if (working_mode & (ACE_WRITE_DATA|ACE_WRITE_NAMED_ATTRS|
+           ACE_APPEND_DATA|ACE_WRITE_ATTRIBUTES|ACE_SYNCHRONIZE))
+               needed_bits |= S_IWUSR;
+       if (working_mode & ACE_EXECUTE)
+               needed_bits |= S_IXUSR;
+
        if ((error = zfs_zaccess_common(check_zp, mode, &working_mode,
            &check_privs, skipaclchk, cr)) == 0) {
                if (is_attr)
-                       VN_RELE(ZTOV(xzp));
-               return (0);
+                       iput(ZTOI(xzp));
+               return (secpolicy_vnode_access2(cr, ZTOI(zp), owner,
+                   needed_bits, needed_bits));
        }
 
        if (error && !check_privs) {
                if (is_attr)
-                       VN_RELE(ZTOV(xzp));
+                       iput(ZTOI(xzp));
                return (error);
        }
 
@@ -2585,12 +2556,8 @@ zfs_zaccess(znode_t *zp, int mode, int flags, boolean_t skipaclchk, cred_t *cr)
        }
 
        if (error && check_privs) {
-               uid_t           owner;
                mode_t          checkmode = 0;
 
-               owner = zfs_fuid_map_id(zfsvfs, check_zp->z_phys->zp_uid, cr,
-                   ZFS_OWNER);
-
                /*
                 * First check for implicit owner permission on
                 * read_acl/read_attributes
@@ -2605,16 +2572,15 @@ zfs_zaccess(znode_t *zp, int mode, int flags, boolean_t skipaclchk, cred_t *cr)
 
                if (working_mode & (ACE_READ_DATA|ACE_READ_NAMED_ATTRS|
                    ACE_READ_ACL|ACE_READ_ATTRIBUTES|ACE_SYNCHRONIZE))
-                       checkmode |= VREAD;
+                       checkmode |= S_IRUSR;
                if (working_mode & (ACE_WRITE_DATA|ACE_WRITE_NAMED_ATTRS|
                    ACE_APPEND_DATA|ACE_WRITE_ATTRIBUTES|ACE_SYNCHRONIZE))
-                       checkmode |= VWRITE;
+                       checkmode |= S_IWUSR;
                if (working_mode & ACE_EXECUTE)
-                       checkmode |= VEXEC;
+                       checkmode |= S_IXUSR;
 
-               if (checkmode)
-                       error = secpolicy_vnode_access(cr, ZTOV(check_zp),
-                           owner, checkmode);
+               error = secpolicy_vnode_access2(cr, ZTOI(check_zp), owner,
+                   needed_bits & ~checkmode, needed_bits);
 
                if (error == 0 && (working_mode & ACE_WRITE_OWNER))
                        error = secpolicy_vnode_chown(cr, owner);
@@ -2634,19 +2600,22 @@ zfs_zaccess(znode_t *zp, int mode, int flags, boolean_t skipaclchk, cred_t *cr)
                         * for are still present.  If so then return EACCES
                         */
                        if (working_mode & ~(ZFS_CHECKED_MASKS)) {
-                               error = EACCES;
+                               error = SET_ERROR(EACCES);
                        }
                }
+       } else if (error == 0) {
+               error = secpolicy_vnode_access2(cr, ZTOI(zp), owner,
+                   needed_bits, needed_bits);
        }
 
        if (is_attr)
-               VN_RELE(ZTOV(xzp));
+               iput(ZTOI(xzp));
 
        return (error);
 }
 
 /*
- * Translate traditional unix VREAD/VWRITE/VEXEC mode into
+ * Translate traditional unix S_IRUSR/S_IWUSR/S_IXUSR mode into
  * native ACL format and call zfs_zaccess()
  */
 int
@@ -2668,15 +2637,16 @@ zfs_zaccess_unix(znode_t *zp, mode_t mode, cred_t *cr)
 
 static int
 zfs_delete_final_check(znode_t *zp, znode_t *dzp,
-    mode_t missing_perms, cred_t *cr)
+    mode_t available_perms, cred_t *cr)
 {
        int error;
        uid_t downer;
-       zfsvfs_t *zfsvfs = zp->z_zfsvfs;
 
-       downer = zfs_fuid_map_id(zfsvfs, dzp->z_phys->zp_uid, cr, ZFS_OWNER);
+       downer = zfs_fuid_map_id(ZTOZSB(dzp), KUID_TO_SUID(ZTOI(dzp)->i_uid),
+           cr, ZFS_OWNER);
 
-       error = secpolicy_vnode_access(cr, ZTOV(dzp), downer, missing_perms);
+       error = secpolicy_vnode_access2(cr, ZTOI(dzp),
+           downer, available_perms, S_IWUSR|S_IXUSR);
 
        if (error == 0)
                error = zfs_sticky_remove_access(dzp, zp, cr);
@@ -2688,7 +2658,6 @@ zfs_delete_final_check(znode_t *zp, znode_t *dzp,
  * Determine whether Access should be granted/deny, without
  * consulting least priv subsystem.
  *
- *
  * The following chart is the recommended NFSv4 enforcement for
  * ability to delete an object.
  *
@@ -2725,7 +2694,7 @@ zfs_zaccess_delete(znode_t *dzp, znode_t *zp, cred_t *cr)
        uint32_t dzp_working_mode = 0;
        uint32_t zp_working_mode = 0;
        int dzp_error, zp_error;
-       mode_t missing_perms;
+       mode_t available_perms;
        boolean_t dzpcheck_privs = B_TRUE;
        boolean_t zpcheck_privs = B_TRUE;
 
@@ -2743,8 +2712,8 @@ zfs_zaccess_delete(znode_t *dzp, znode_t *zp, cred_t *cr)
         * to determine what was found.
         */
 
-       if (zp->z_phys->zp_flags & (ZFS_IMMUTABLE | ZFS_NOUNLINK))
-               return (EPERM);
+       if (zp->z_pflags & (ZFS_IMMUTABLE | ZFS_NOUNLINK))
+               return (SET_ERROR(EPERM));
 
        /*
         * First row
@@ -2786,23 +2755,20 @@ zfs_zaccess_delete(znode_t *dzp, znode_t *zp, cred_t *cr)
         * only need to see if we have write/execute on directory.
         */
 
-       if ((dzp_error = zfs_zaccess_common(dzp, ACE_EXECUTE|ACE_WRITE_DATA,
-           &dzp_working_mode, &dzpcheck_privs, B_FALSE, cr)) == 0)
-               return (zfs_sticky_remove_access(dzp, zp, cr));
+       dzp_error = zfs_zaccess_common(dzp, ACE_EXECUTE|ACE_WRITE_DATA,
+           &dzp_working_mode, &dzpcheck_privs, B_FALSE, cr);
 
-       if (!dzpcheck_privs)
+       if (dzp_error != 0 && !dzpcheck_privs)
                return (dzp_error);
 
        /*
         * Fourth row
         */
 
-       missing_perms = (dzp_working_mode & ACE_WRITE_DATA) ? VWRITE : 0;
-       missing_perms |= (dzp_working_mode & ACE_EXECUTE) ? VEXEC : 0;
-
-       ASSERT(missing_perms);
+       available_perms = (dzp_working_mode & ACE_WRITE_DATA) ? 0 : S_IWUSR;
+       available_perms |= (dzp_working_mode & ACE_EXECUTE) ? 0 : S_IXUSR;
 
-       return (zfs_delete_final_check(zp, dzp, missing_perms, cr));
+       return (zfs_delete_final_check(zp, dzp, available_perms, cr));
 
 }
 
@@ -2813,10 +2779,10 @@ zfs_zaccess_rename(znode_t *sdzp, znode_t *szp, znode_t *tdzp,
        int add_perm;
        int error;
 
-       if (szp->z_phys->zp_flags & ZFS_AV_QUARANTINED)
-               return (EACCES);
+       if (szp->z_pflags & ZFS_AV_QUARANTINED)
+               return (SET_ERROR(EACCES));
 
-       add_perm = (ZTOV(szp)->v_type == VDIR) ?
+       add_perm = S_ISDIR(ZTOI(szp)->i_mode) ?
            ACE_ADD_SUBDIRECTORY : ACE_ADD_FILE;
 
        /*
@@ -2830,14 +2796,14 @@ zfs_zaccess_rename(znode_t *sdzp, znode_t *szp, znode_t *tdzp,
         * If that succeeds then check for add_file/add_subdir permissions
         */
 
-       if (error = zfs_zaccess_delete(sdzp, szp, cr))
+       if ((error = zfs_zaccess_delete(sdzp, szp, cr)))
                return (error);
 
        /*
         * If we have a tzp, see if we can delete it?
         */
        if (tzp) {
-               if (error = zfs_zaccess_delete(tdzp, tzp, cr))
+               if ((error = zfs_zaccess_delete(tdzp, tzp, cr)))
                        return (error);
        }