]> git.proxmox.com Git - mirror_zfs-debian.git/blame - module/zfs/zfs_fuid.c
New upstream version 0.7.2
[mirror_zfs-debian.git] / module / zfs / zfs_fuid.c
CommitLineData
34dc7c2f
BB
1/*
2 * CDDL HEADER START
3 *
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
7 *
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
12 *
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
18 *
19 * CDDL HEADER END
20 */
21/*
428870ff 22 * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
34dc7c2f
BB
23 */
24
34dc7c2f 25#include <sys/zfs_context.h>
34dc7c2f
BB
26#include <sys/dmu.h>
27#include <sys/avl.h>
28#include <sys/zap.h>
29#include <sys/refcount.h>
30#include <sys/nvpair.h>
31#ifdef _KERNEL
32#include <sys/kidmap.h>
33#include <sys/sid.h>
34#include <sys/zfs_vfsops.h>
35#include <sys/zfs_znode.h>
36#endif
37#include <sys/zfs_fuid.h>
38
39/*
40 * FUID Domain table(s).
41 *
42 * The FUID table is stored as a packed nvlist of an array
43 * of nvlists which contain an index, domain string and offset
44 *
45 * During file system initialization the nvlist(s) are read and
46 * two AVL trees are created. One tree is keyed by the index number
47 * and the other by the domain string. Nodes are never removed from
9babb374 48 * trees, but new entries may be added. If a new entry is added then
cae5b340 49 * the zfsvfs->z_fuid_dirty flag is set to true and the caller will then
9babb374
BB
50 * be responsible for calling zfs_fuid_sync() to sync the changes to disk.
51 *
34dc7c2f
BB
52 */
53
54#define FUID_IDX "fuid_idx"
55#define FUID_DOMAIN "fuid_domain"
56#define FUID_OFFSET "fuid_offset"
57#define FUID_NVP_ARRAY "fuid_nvlist"
58
59typedef struct fuid_domain {
60 avl_node_t f_domnode;
61 avl_node_t f_idxnode;
62 ksiddomain_t *f_ksid;
63 uint64_t f_idx;
64} fuid_domain_t;
65
b128c09f
BB
66static char *nulldomain = "";
67
34dc7c2f
BB
68/*
69 * Compare two indexes.
70 */
71static int
72idx_compare(const void *arg1, const void *arg2)
73{
cae5b340
AX
74 const fuid_domain_t *node1 = (const fuid_domain_t *)arg1;
75 const fuid_domain_t *node2 = (const fuid_domain_t *)arg2;
34dc7c2f 76
cae5b340 77 return (AVL_CMP(node1->f_idx, node2->f_idx));
34dc7c2f
BB
78}
79
80/*
81 * Compare two domain strings.
82 */
83static int
84domain_compare(const void *arg1, const void *arg2)
85{
cae5b340
AX
86 const fuid_domain_t *node1 = (const fuid_domain_t *)arg1;
87 const fuid_domain_t *node2 = (const fuid_domain_t *)arg2;
34dc7c2f
BB
88 int val;
89
90 val = strcmp(node1->f_ksid->kd_name, node2->f_ksid->kd_name);
cae5b340
AX
91
92 return (AVL_ISIGN(val));
34dc7c2f
BB
93}
94
9babb374
BB
95void
96zfs_fuid_avl_tree_create(avl_tree_t *idx_tree, avl_tree_t *domain_tree)
97{
98 avl_create(idx_tree, idx_compare,
99 sizeof (fuid_domain_t), offsetof(fuid_domain_t, f_idxnode));
100 avl_create(domain_tree, domain_compare,
101 sizeof (fuid_domain_t), offsetof(fuid_domain_t, f_domnode));
102}
103
34dc7c2f
BB
104/*
105 * load initial fuid domain and idx trees. This function is used by
106 * both the kernel and zdb.
107 */
108uint64_t
109zfs_fuid_table_load(objset_t *os, uint64_t fuid_obj, avl_tree_t *idx_tree,
110 avl_tree_t *domain_tree)
111{
112 dmu_buf_t *db;
113 uint64_t fuid_size;
114
9babb374
BB
115 ASSERT(fuid_obj != 0);
116 VERIFY(0 == dmu_bonus_hold(os, fuid_obj,
117 FTAG, &db));
34dc7c2f
BB
118 fuid_size = *(uint64_t *)db->db_data;
119 dmu_buf_rele(db, FTAG);
120
121 if (fuid_size) {
122 nvlist_t **fuidnvp;
123 nvlist_t *nvp = NULL;
124 uint_t count;
125 char *packed;
126 int i;
127
128 packed = kmem_alloc(fuid_size, KM_SLEEP);
9babb374
BB
129 VERIFY(dmu_read(os, fuid_obj, 0,
130 fuid_size, packed, DMU_READ_PREFETCH) == 0);
34dc7c2f
BB
131 VERIFY(nvlist_unpack(packed, fuid_size,
132 &nvp, 0) == 0);
133 VERIFY(nvlist_lookup_nvlist_array(nvp, FUID_NVP_ARRAY,
134 &fuidnvp, &count) == 0);
135
136 for (i = 0; i != count; i++) {
137 fuid_domain_t *domnode;
138 char *domain;
139 uint64_t idx;
140
141 VERIFY(nvlist_lookup_string(fuidnvp[i], FUID_DOMAIN,
142 &domain) == 0);
143 VERIFY(nvlist_lookup_uint64(fuidnvp[i], FUID_IDX,
144 &idx) == 0);
145
146 domnode = kmem_alloc(sizeof (fuid_domain_t), KM_SLEEP);
147
148 domnode->f_idx = idx;
149 domnode->f_ksid = ksid_lookupdomain(domain);
150 avl_add(idx_tree, domnode);
151 avl_add(domain_tree, domnode);
152 }
153 nvlist_free(nvp);
154 kmem_free(packed, fuid_size);
155 }
156 return (fuid_size);
157}
158
159void
160zfs_fuid_table_destroy(avl_tree_t *idx_tree, avl_tree_t *domain_tree)
161{
162 fuid_domain_t *domnode;
163 void *cookie;
164
165 cookie = NULL;
c65aa5b2 166 while ((domnode = avl_destroy_nodes(domain_tree, &cookie)))
34dc7c2f
BB
167 ksiddomain_rele(domnode->f_ksid);
168
169 avl_destroy(domain_tree);
170 cookie = NULL;
c65aa5b2 171 while ((domnode = avl_destroy_nodes(idx_tree, &cookie)))
34dc7c2f
BB
172 kmem_free(domnode, sizeof (fuid_domain_t));
173 avl_destroy(idx_tree);
174}
175
176char *
177zfs_fuid_idx_domain(avl_tree_t *idx_tree, uint32_t idx)
178{
179 fuid_domain_t searchnode, *findnode;
180 avl_index_t loc;
181
182 searchnode.f_idx = idx;
183
184 findnode = avl_find(idx_tree, &searchnode, &loc);
185
b128c09f 186 return (findnode ? findnode->f_ksid->kd_name : nulldomain);
34dc7c2f
BB
187}
188
189#ifdef _KERNEL
190/*
191 * Load the fuid table(s) into memory.
192 */
193static void
cae5b340 194zfs_fuid_init(zfsvfs_t *zfsvfs)
34dc7c2f 195{
cae5b340 196 rw_enter(&zfsvfs->z_fuid_lock, RW_WRITER);
34dc7c2f 197
cae5b340
AX
198 if (zfsvfs->z_fuid_loaded) {
199 rw_exit(&zfsvfs->z_fuid_lock);
34dc7c2f
BB
200 return;
201 }
202
cae5b340 203 zfs_fuid_avl_tree_create(&zfsvfs->z_fuid_idx, &zfsvfs->z_fuid_domain);
34dc7c2f 204
cae5b340
AX
205 (void) zap_lookup(zfsvfs->z_os, MASTER_NODE_OBJ,
206 ZFS_FUID_TABLES, 8, 1, &zfsvfs->z_fuid_obj);
207 if (zfsvfs->z_fuid_obj != 0) {
208 zfsvfs->z_fuid_size = zfs_fuid_table_load(zfsvfs->z_os,
209 zfsvfs->z_fuid_obj, &zfsvfs->z_fuid_idx,
210 &zfsvfs->z_fuid_domain);
b128c09f 211 }
34dc7c2f 212
cae5b340
AX
213 zfsvfs->z_fuid_loaded = B_TRUE;
214 rw_exit(&zfsvfs->z_fuid_lock);
9babb374
BB
215}
216
217/*
218 * sync out AVL trees to persistent storage.
219 */
220void
cae5b340 221zfs_fuid_sync(zfsvfs_t *zfsvfs, dmu_tx_t *tx)
9babb374
BB
222{
223 nvlist_t *nvp;
224 nvlist_t **fuids;
225 size_t nvsize = 0;
226 char *packed;
227 dmu_buf_t *db;
228 fuid_domain_t *domnode;
229 int numnodes;
230 int i;
231
cae5b340 232 if (!zfsvfs->z_fuid_dirty) {
9babb374
BB
233 return;
234 }
235
cae5b340 236 rw_enter(&zfsvfs->z_fuid_lock, RW_WRITER);
9babb374
BB
237
238 /*
239 * First see if table needs to be created?
240 */
cae5b340
AX
241 if (zfsvfs->z_fuid_obj == 0) {
242 zfsvfs->z_fuid_obj = dmu_object_alloc(zfsvfs->z_os,
9babb374
BB
243 DMU_OT_FUID, 1 << 14, DMU_OT_FUID_SIZE,
244 sizeof (uint64_t), tx);
cae5b340 245 VERIFY(zap_add(zfsvfs->z_os, MASTER_NODE_OBJ,
9babb374 246 ZFS_FUID_TABLES, sizeof (uint64_t), 1,
cae5b340 247 &zfsvfs->z_fuid_obj, tx) == 0);
9babb374
BB
248 }
249
250 VERIFY(nvlist_alloc(&nvp, NV_UNIQUE_NAME, KM_SLEEP) == 0);
251
cae5b340 252 numnodes = avl_numnodes(&zfsvfs->z_fuid_idx);
9babb374 253 fuids = kmem_alloc(numnodes * sizeof (void *), KM_SLEEP);
cae5b340
AX
254 for (i = 0, domnode = avl_first(&zfsvfs->z_fuid_domain); domnode; i++,
255 domnode = AVL_NEXT(&zfsvfs->z_fuid_domain, domnode)) {
9babb374
BB
256 VERIFY(nvlist_alloc(&fuids[i], NV_UNIQUE_NAME, KM_SLEEP) == 0);
257 VERIFY(nvlist_add_uint64(fuids[i], FUID_IDX,
258 domnode->f_idx) == 0);
259 VERIFY(nvlist_add_uint64(fuids[i], FUID_OFFSET, 0) == 0);
260 VERIFY(nvlist_add_string(fuids[i], FUID_DOMAIN,
261 domnode->f_ksid->kd_name) == 0);
262 }
263 VERIFY(nvlist_add_nvlist_array(nvp, FUID_NVP_ARRAY,
264 fuids, numnodes) == 0);
265 for (i = 0; i != numnodes; i++)
266 nvlist_free(fuids[i]);
267 kmem_free(fuids, numnodes * sizeof (void *));
268 VERIFY(nvlist_size(nvp, &nvsize, NV_ENCODE_XDR) == 0);
269 packed = kmem_alloc(nvsize, KM_SLEEP);
270 VERIFY(nvlist_pack(nvp, &packed, &nvsize,
271 NV_ENCODE_XDR, KM_SLEEP) == 0);
272 nvlist_free(nvp);
cae5b340
AX
273 zfsvfs->z_fuid_size = nvsize;
274 dmu_write(zfsvfs->z_os, zfsvfs->z_fuid_obj, 0,
275 zfsvfs->z_fuid_size, packed, tx);
276 kmem_free(packed, zfsvfs->z_fuid_size);
277 VERIFY(0 == dmu_bonus_hold(zfsvfs->z_os, zfsvfs->z_fuid_obj,
9babb374
BB
278 FTAG, &db));
279 dmu_buf_will_dirty(db, tx);
cae5b340 280 *(uint64_t *)db->db_data = zfsvfs->z_fuid_size;
9babb374
BB
281 dmu_buf_rele(db, FTAG);
282
cae5b340
AX
283 zfsvfs->z_fuid_dirty = B_FALSE;
284 rw_exit(&zfsvfs->z_fuid_lock);
34dc7c2f
BB
285}
286
287/*
288 * Query domain table for a given domain.
289 *
9babb374 290 * If domain isn't found and addok is set, it is added to AVL trees and
cae5b340 291 * the zfsvfs->z_fuid_dirty flag will be set to TRUE. It will then be
9babb374
BB
292 * necessary for the caller or another thread to detect the dirty table
293 * and sync out the changes.
34dc7c2f
BB
294 */
295int
cae5b340 296zfs_fuid_find_by_domain(zfsvfs_t *zfsvfs, const char *domain,
9babb374 297 char **retdomain, boolean_t addok)
34dc7c2f
BB
298{
299 fuid_domain_t searchnode, *findnode;
300 avl_index_t loc;
b128c09f 301 krw_t rw = RW_READER;
34dc7c2f
BB
302
303 /*
304 * If the dummy "nobody" domain then return an index of 0
305 * to cause the created FUID to be a standard POSIX id
306 * for the user nobody.
307 */
308 if (domain[0] == '\0') {
9babb374
BB
309 if (retdomain)
310 *retdomain = nulldomain;
34dc7c2f
BB
311 return (0);
312 }
313
314 searchnode.f_ksid = ksid_lookupdomain(domain);
9babb374 315 if (retdomain)
34dc7c2f 316 *retdomain = searchnode.f_ksid->kd_name;
cae5b340
AX
317 if (!zfsvfs->z_fuid_loaded)
318 zfs_fuid_init(zfsvfs);
34dc7c2f 319
b128c09f 320retry:
cae5b340
AX
321 rw_enter(&zfsvfs->z_fuid_lock, rw);
322 findnode = avl_find(&zfsvfs->z_fuid_domain, &searchnode, &loc);
34dc7c2f
BB
323
324 if (findnode) {
cae5b340 325 rw_exit(&zfsvfs->z_fuid_lock);
34dc7c2f
BB
326 ksiddomain_rele(searchnode.f_ksid);
327 return (findnode->f_idx);
9babb374 328 } else if (addok) {
34dc7c2f 329 fuid_domain_t *domnode;
34dc7c2f 330 uint64_t retidx;
34dc7c2f 331
cae5b340
AX
332 if (rw == RW_READER && !rw_tryupgrade(&zfsvfs->z_fuid_lock)) {
333 rw_exit(&zfsvfs->z_fuid_lock);
b128c09f
BB
334 rw = RW_WRITER;
335 goto retry;
336 }
337
34dc7c2f
BB
338 domnode = kmem_alloc(sizeof (fuid_domain_t), KM_SLEEP);
339 domnode->f_ksid = searchnode.f_ksid;
340
cae5b340 341 retidx = domnode->f_idx = avl_numnodes(&zfsvfs->z_fuid_idx) + 1;
34dc7c2f 342
cae5b340
AX
343 avl_add(&zfsvfs->z_fuid_domain, domnode);
344 avl_add(&zfsvfs->z_fuid_idx, domnode);
345 zfsvfs->z_fuid_dirty = B_TRUE;
346 rw_exit(&zfsvfs->z_fuid_lock);
34dc7c2f 347 return (retidx);
9babb374 348 } else {
cae5b340 349 rw_exit(&zfsvfs->z_fuid_lock);
9babb374 350 return (-1);
34dc7c2f
BB
351 }
352}
353
354/*
355 * Query domain table by index, returning domain string
356 *
357 * Returns a pointer from an avl node of the domain string.
358 *
359 */
9babb374 360const char *
cae5b340 361zfs_fuid_find_by_idx(zfsvfs_t *zfsvfs, uint32_t idx)
34dc7c2f
BB
362{
363 char *domain;
364
cae5b340 365 if (idx == 0 || !zfsvfs->z_use_fuids)
34dc7c2f
BB
366 return (NULL);
367
cae5b340
AX
368 if (!zfsvfs->z_fuid_loaded)
369 zfs_fuid_init(zfsvfs);
34dc7c2f 370
cae5b340 371 rw_enter(&zfsvfs->z_fuid_lock, RW_READER);
b128c09f 372
cae5b340
AX
373 if (zfsvfs->z_fuid_obj || zfsvfs->z_fuid_dirty)
374 domain = zfs_fuid_idx_domain(&zfsvfs->z_fuid_idx, idx);
b128c09f
BB
375 else
376 domain = nulldomain;
cae5b340 377 rw_exit(&zfsvfs->z_fuid_lock);
34dc7c2f
BB
378
379 ASSERT(domain);
380 return (domain);
381}
382
383void
384zfs_fuid_map_ids(znode_t *zp, cred_t *cr, uid_t *uidp, uid_t *gidp)
385{
cae5b340
AX
386 *uidp = zfs_fuid_map_id(ZTOZSB(zp), KUID_TO_SUID(ZTOI(zp)->i_uid),
387 cr, ZFS_OWNER);
388 *gidp = zfs_fuid_map_id(ZTOZSB(zp), KGID_TO_SGID(ZTOI(zp)->i_gid),
389 cr, ZFS_GROUP);
34dc7c2f
BB
390}
391
392uid_t
cae5b340 393zfs_fuid_map_id(zfsvfs_t *zfsvfs, uint64_t fuid,
34dc7c2f
BB
394 cred_t *cr, zfs_fuid_type_t type)
395{
a405c8a6 396#ifdef HAVE_KSID
34dc7c2f 397 uint32_t index = FUID_INDEX(fuid);
9babb374 398 const char *domain;
34dc7c2f
BB
399 uid_t id;
400
401 if (index == 0)
402 return (fuid);
403
cae5b340 404 domain = zfs_fuid_find_by_idx(zfsvfs, index);
34dc7c2f
BB
405 ASSERT(domain != NULL);
406
407 if (type == ZFS_OWNER || type == ZFS_ACE_USER) {
408 (void) kidmap_getuidbysid(crgetzone(cr), domain,
409 FUID_RID(fuid), &id);
410 } else {
411 (void) kidmap_getgidbysid(crgetzone(cr), domain,
412 FUID_RID(fuid), &id);
413 }
414 return (id);
a405c8a6 415#else
5484965a
BB
416 /*
417 * The Linux port only supports POSIX IDs, use the passed id.
418 */
419 return (fuid);
a405c8a6 420#endif /* HAVE_KSID */
34dc7c2f
BB
421}
422
423/*
424 * Add a FUID node to the list of fuid's being created for this
425 * ACL
426 *
427 * If ACL has multiple domains, then keep only one copy of each unique
428 * domain.
429 */
428870ff 430void
34dc7c2f
BB
431zfs_fuid_node_add(zfs_fuid_info_t **fuidpp, const char *domain, uint32_t rid,
432 uint64_t idx, uint64_t id, zfs_fuid_type_t type)
433{
434 zfs_fuid_t *fuid;
435 zfs_fuid_domain_t *fuid_domain;
436 zfs_fuid_info_t *fuidp;
437 uint64_t fuididx;
438 boolean_t found = B_FALSE;
439
440 if (*fuidpp == NULL)
441 *fuidpp = zfs_fuid_info_alloc();
442
443 fuidp = *fuidpp;
444 /*
445 * First find fuid domain index in linked list
446 *
447 * If one isn't found then create an entry.
448 */
449
450 for (fuididx = 1, fuid_domain = list_head(&fuidp->z_domains);
451 fuid_domain; fuid_domain = list_next(&fuidp->z_domains,
452 fuid_domain), fuididx++) {
453 if (idx == fuid_domain->z_domidx) {
454 found = B_TRUE;
455 break;
456 }
457 }
458
459 if (!found) {
460 fuid_domain = kmem_alloc(sizeof (zfs_fuid_domain_t), KM_SLEEP);
461 fuid_domain->z_domain = domain;
462 fuid_domain->z_domidx = idx;
463 list_insert_tail(&fuidp->z_domains, fuid_domain);
464 fuidp->z_domain_str_sz += strlen(domain) + 1;
465 fuidp->z_domain_cnt++;
466 }
467
468 if (type == ZFS_ACE_USER || type == ZFS_ACE_GROUP) {
9babb374 469
34dc7c2f
BB
470 /*
471 * Now allocate fuid entry and add it on the end of the list
472 */
473
474 fuid = kmem_alloc(sizeof (zfs_fuid_t), KM_SLEEP);
475 fuid->z_id = id;
476 fuid->z_domidx = idx;
477 fuid->z_logfuid = FUID_ENCODE(fuididx, rid);
478
479 list_insert_tail(&fuidp->z_fuids, fuid);
480 fuidp->z_fuid_cnt++;
481 } else {
482 if (type == ZFS_OWNER)
483 fuidp->z_fuid_owner = FUID_ENCODE(fuididx, rid);
484 else
485 fuidp->z_fuid_group = FUID_ENCODE(fuididx, rid);
486 }
487}
488
a405c8a6 489#ifdef HAVE_KSID
34dc7c2f
BB
490/*
491 * Create a file system FUID, based on information in the users cred
428870ff
BB
492 *
493 * If cred contains KSID_OWNER then it should be used to determine
494 * the uid otherwise cred's uid will be used. By default cred's gid
495 * is used unless it's an ephemeral ID in which case KSID_GROUP will
496 * be used if it exists.
34dc7c2f
BB
497 */
498uint64_t
cae5b340 499zfs_fuid_create_cred(zfsvfs_t *zfsvfs, zfs_fuid_type_t type,
9babb374 500 cred_t *cr, zfs_fuid_info_t **fuidp)
34dc7c2f
BB
501{
502 uint64_t idx;
503 ksid_t *ksid;
504 uint32_t rid;
3558fd73 505 char *kdomain;
34dc7c2f
BB
506 const char *domain;
507 uid_t id;
508
509 VERIFY(type == ZFS_OWNER || type == ZFS_GROUP);
510
b128c09f 511 ksid = crgetsid(cr, (type == ZFS_OWNER) ? KSID_OWNER : KSID_GROUP);
428870ff 512
cae5b340 513 if (!zfsvfs->z_use_fuids || (ksid == NULL)) {
428870ff
BB
514 id = (type == ZFS_OWNER) ? crgetuid(cr) : crgetgid(cr);
515
516 if (IS_EPHEMERAL(id))
517 return ((type == ZFS_OWNER) ? UID_NOBODY : GID_NOBODY);
518
519 return ((uint64_t)id);
b128c09f 520 }
34dc7c2f 521
428870ff
BB
522 /*
523 * ksid is present and FUID is supported
524 */
525 id = (type == ZFS_OWNER) ? ksid_getid(ksid) : crgetgid(cr);
526
527 if (!IS_EPHEMERAL(id))
34dc7c2f
BB
528 return ((uint64_t)id);
529
428870ff
BB
530 if (type == ZFS_GROUP)
531 id = ksid_getid(ksid);
532
34dc7c2f
BB
533 rid = ksid_getrid(ksid);
534 domain = ksid_getdomain(ksid);
535
cae5b340 536 idx = zfs_fuid_find_by_domain(zfsvfs, domain, &kdomain, B_TRUE);
34dc7c2f
BB
537
538 zfs_fuid_node_add(fuidp, kdomain, rid, idx, id, type);
539
540 return (FUID_ENCODE(idx, rid));
541}
a405c8a6 542#endif /* HAVE_KSID */
34dc7c2f
BB
543
544/*
545 * Create a file system FUID for an ACL ace
546 * or a chown/chgrp of the file.
547 * This is similar to zfs_fuid_create_cred, except that
548 * we can't find the domain + rid information in the
549 * cred. Instead we have to query Winchester for the
550 * domain and rid.
551 *
552 * During replay operations the domain+rid information is
553 * found in the zfs_fuid_info_t that the replay code has
cae5b340 554 * attached to the zfsvfs of the file system.
34dc7c2f
BB
555 */
556uint64_t
cae5b340 557zfs_fuid_create(zfsvfs_t *zfsvfs, uint64_t id, cred_t *cr,
9babb374 558 zfs_fuid_type_t type, zfs_fuid_info_t **fuidpp)
34dc7c2f 559{
a405c8a6 560#ifdef HAVE_KSID
34dc7c2f
BB
561 const char *domain;
562 char *kdomain;
563 uint32_t fuid_idx = FUID_INDEX(id);
564 uint32_t rid;
565 idmap_stat status;
a08ee875 566 uint64_t idx = 0;
34dc7c2f 567 zfs_fuid_t *zfuid = NULL;
a08ee875 568 zfs_fuid_info_t *fuidp = NULL;
34dc7c2f
BB
569
570 /*
571 * If POSIX ID, or entry is already a FUID then
572 * just return the id
573 *
574 * We may also be handed an already FUID'ized id via
575 * chmod.
576 */
577
cae5b340 578 if (!zfsvfs->z_use_fuids || !IS_EPHEMERAL(id) || fuid_idx != 0)
34dc7c2f
BB
579 return (id);
580
cae5b340
AX
581 if (zfsvfs->z_replay) {
582 fuidp = zfsvfs->z_fuid_replay;
34dc7c2f
BB
583
584 /*
585 * If we are passed an ephemeral id, but no
586 * fuid_info was logged then return NOBODY.
587 * This is most likely a result of idmap service
588 * not being available.
589 */
590 if (fuidp == NULL)
591 return (UID_NOBODY);
592
a08ee875
LG
593 VERIFY3U(type, >=, ZFS_OWNER);
594 VERIFY3U(type, <=, ZFS_ACE_GROUP);
595
34dc7c2f
BB
596 switch (type) {
597 case ZFS_ACE_USER:
598 case ZFS_ACE_GROUP:
599 zfuid = list_head(&fuidp->z_fuids);
600 rid = FUID_RID(zfuid->z_logfuid);
601 idx = FUID_INDEX(zfuid->z_logfuid);
602 break;
603 case ZFS_OWNER:
604 rid = FUID_RID(fuidp->z_fuid_owner);
605 idx = FUID_INDEX(fuidp->z_fuid_owner);
606 break;
607 case ZFS_GROUP:
608 rid = FUID_RID(fuidp->z_fuid_group);
609 idx = FUID_INDEX(fuidp->z_fuid_group);
610 break;
611 };
a08ee875 612 domain = fuidp->z_domain_table[idx - 1];
34dc7c2f
BB
613 } else {
614 if (type == ZFS_OWNER || type == ZFS_ACE_USER)
615 status = kidmap_getsidbyuid(crgetzone(cr), id,
616 &domain, &rid);
617 else
618 status = kidmap_getsidbygid(crgetzone(cr), id,
619 &domain, &rid);
620
621 if (status != 0) {
622 /*
623 * When returning nobody we will need to
624 * make a dummy fuid table entry for logging
625 * purposes.
626 */
627 rid = UID_NOBODY;
b128c09f 628 domain = nulldomain;
34dc7c2f
BB
629 }
630 }
631
cae5b340 632 idx = zfs_fuid_find_by_domain(zfsvfs, domain, &kdomain, B_TRUE);
34dc7c2f 633
cae5b340 634 if (!zfsvfs->z_replay)
9babb374
BB
635 zfs_fuid_node_add(fuidpp, kdomain,
636 rid, idx, id, type);
34dc7c2f
BB
637 else if (zfuid != NULL) {
638 list_remove(&fuidp->z_fuids, zfuid);
639 kmem_free(zfuid, sizeof (zfs_fuid_t));
640 }
641 return (FUID_ENCODE(idx, rid));
a405c8a6 642#else
037849f8
BB
643 /*
644 * The Linux port only supports POSIX IDs, use the passed id.
645 */
646 return (id);
a405c8a6 647#endif
34dc7c2f
BB
648}
649
650void
cae5b340 651zfs_fuid_destroy(zfsvfs_t *zfsvfs)
34dc7c2f 652{
cae5b340
AX
653 rw_enter(&zfsvfs->z_fuid_lock, RW_WRITER);
654 if (!zfsvfs->z_fuid_loaded) {
655 rw_exit(&zfsvfs->z_fuid_lock);
34dc7c2f
BB
656 return;
657 }
cae5b340
AX
658 zfs_fuid_table_destroy(&zfsvfs->z_fuid_idx, &zfsvfs->z_fuid_domain);
659 rw_exit(&zfsvfs->z_fuid_lock);
34dc7c2f
BB
660}
661
662/*
663 * Allocate zfs_fuid_info for tracking FUIDs created during
664 * zfs_mknode, VOP_SETATTR() or VOP_SETSECATTR()
665 */
666zfs_fuid_info_t *
667zfs_fuid_info_alloc(void)
668{
669 zfs_fuid_info_t *fuidp;
670
671 fuidp = kmem_zalloc(sizeof (zfs_fuid_info_t), KM_SLEEP);
672 list_create(&fuidp->z_domains, sizeof (zfs_fuid_domain_t),
673 offsetof(zfs_fuid_domain_t, z_next));
674 list_create(&fuidp->z_fuids, sizeof (zfs_fuid_t),
675 offsetof(zfs_fuid_t, z_next));
676 return (fuidp);
677}
678
679/*
680 * Release all memory associated with zfs_fuid_info_t
681 */
682void
683zfs_fuid_info_free(zfs_fuid_info_t *fuidp)
684{
685 zfs_fuid_t *zfuid;
686 zfs_fuid_domain_t *zdomain;
687
688 while ((zfuid = list_head(&fuidp->z_fuids)) != NULL) {
689 list_remove(&fuidp->z_fuids, zfuid);
690 kmem_free(zfuid, sizeof (zfs_fuid_t));
691 }
692
693 if (fuidp->z_domain_table != NULL)
694 kmem_free(fuidp->z_domain_table,
cae5b340 695 (sizeof (char *)) * fuidp->z_domain_cnt);
34dc7c2f
BB
696
697 while ((zdomain = list_head(&fuidp->z_domains)) != NULL) {
698 list_remove(&fuidp->z_domains, zdomain);
699 kmem_free(zdomain, sizeof (zfs_fuid_domain_t));
700 }
701
702 kmem_free(fuidp, sizeof (zfs_fuid_info_t));
703}
704
705/*
706 * Check to see if id is a groupmember. If cred
707 * has ksid info then sidlist is checked first
708 * and if still not found then POSIX groups are checked
709 *
710 * Will use a straight FUID compare when possible.
711 */
712boolean_t
cae5b340 713zfs_groupmember(zfsvfs_t *zfsvfs, uint64_t id, cred_t *cr)
34dc7c2f 714{
a405c8a6 715#ifdef HAVE_KSID
34dc7c2f 716 ksid_t *ksid = crgetsid(cr, KSID_GROUP);
9babb374 717 ksidlist_t *ksidlist = crgetsidlist(cr);
34dc7c2f
BB
718 uid_t gid;
719
9babb374 720 if (ksid && ksidlist) {
3558fd73 721 int i;
34dc7c2f 722 ksid_t *ksid_groups;
34dc7c2f
BB
723 uint32_t idx = FUID_INDEX(id);
724 uint32_t rid = FUID_RID(id);
725
34dc7c2f
BB
726 ksid_groups = ksidlist->ksl_sids;
727
728 for (i = 0; i != ksidlist->ksl_nsid; i++) {
729 if (idx == 0) {
730 if (id != IDMAP_WK_CREATOR_GROUP_GID &&
731 id == ksid_groups[i].ks_id) {
732 return (B_TRUE);
733 }
734 } else {
9babb374 735 const char *domain;
34dc7c2f 736
cae5b340 737 domain = zfs_fuid_find_by_idx(zfsvfs, idx);
34dc7c2f
BB
738 ASSERT(domain != NULL);
739
740 if (strcmp(domain,
741 IDMAP_WK_CREATOR_SID_AUTHORITY) == 0)
742 return (B_FALSE);
743
744 if ((strcmp(domain,
745 ksid_groups[i].ks_domain->kd_name) == 0) &&
746 rid == ksid_groups[i].ks_rid)
747 return (B_TRUE);
748 }
749 }
750 }
751
752 /*
753 * Not found in ksidlist, check posix groups
754 */
cae5b340 755 gid = zfs_fuid_map_id(zfsvfs, id, cr, ZFS_GROUP);
34dc7c2f 756 return (groupmember(gid, cr));
a405c8a6
BB
757#else
758 return (B_TRUE);
759#endif
34dc7c2f 760}
9babb374
BB
761
762void
cae5b340 763zfs_fuid_txhold(zfsvfs_t *zfsvfs, dmu_tx_t *tx)
9babb374 764{
cae5b340 765 if (zfsvfs->z_fuid_obj == 0) {
9babb374
BB
766 dmu_tx_hold_bonus(tx, DMU_NEW_OBJECT);
767 dmu_tx_hold_write(tx, DMU_NEW_OBJECT, 0,
cae5b340 768 FUID_SIZE_ESTIMATE(zfsvfs));
9babb374
BB
769 dmu_tx_hold_zap(tx, MASTER_NODE_OBJ, FALSE, NULL);
770 } else {
cae5b340
AX
771 dmu_tx_hold_bonus(tx, zfsvfs->z_fuid_obj);
772 dmu_tx_hold_write(tx, zfsvfs->z_fuid_obj, 0,
773 FUID_SIZE_ESTIMATE(zfsvfs));
9babb374
BB
774 }
775}
34dc7c2f 776#endif