]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blob - fs/configfs/dir.c
fs: make helpers idmap mount aware
[mirror_ubuntu-jammy-kernel.git] / fs / configfs / dir.c
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /* -*- mode: c; c-basic-offset: 8; -*-
3 * vim: noexpandtab sw=8 ts=8 sts=0:
4 *
5 * dir.c - Operations for configfs directories.
6 *
7 * Based on sysfs:
8 * sysfs is Copyright (C) 2001, 2002, 2003 Patrick Mochel
9 *
10 * configfs Copyright (C) 2005 Oracle. All rights reserved.
11 */
12
13 #undef DEBUG
14
15 #include <linux/fs.h>
16 #include <linux/fsnotify.h>
17 #include <linux/mount.h>
18 #include <linux/module.h>
19 #include <linux/slab.h>
20 #include <linux/err.h>
21
22 #include <linux/configfs.h>
23 #include "configfs_internal.h"
24
/*
 * configfs_dirent_lock, together with the proper i_mutex, guards every
 * mutation of configfs_dirent linkage.  It also guards mutations of the
 * linkage between a symlink and its target configfs_dirent.
 *
 * Anyone mutating configfs_dirent linkage must hold *both* the proper inode
 * lock and configfs_dirent_lock, taken in that order.  This makes it possible
 * to traverse configfs_dirent trees and symlinks safely without having to
 * lock inodes.
 *
 * The lock also guards the setting of CONFIGFS_USET_DROPPING: testing that
 * flag unlocked is not reliable, except in detach_groups() when called from
 * rmdir()/unregister() and from configfs_attach_group().
 */
DEFINE_SPINLOCK(configfs_dirent_lock);
38
39 static void configfs_d_iput(struct dentry * dentry,
40 struct inode * inode)
41 {
42 struct configfs_dirent *sd = dentry->d_fsdata;
43
44 if (sd) {
45 /* Coordinate with configfs_readdir */
46 spin_lock(&configfs_dirent_lock);
47 /*
48 * Set sd->s_dentry to null only when this dentry is the one
49 * that is going to be killed. Otherwise configfs_d_iput may
50 * run just after configfs_attach_attr and set sd->s_dentry to
51 * NULL even it's still in use.
52 */
53 if (sd->s_dentry == dentry)
54 sd->s_dentry = NULL;
55
56 spin_unlock(&configfs_dirent_lock);
57 configfs_put(sd);
58 }
59 iput(inode);
60 }
61
62 const struct dentry_operations configfs_dentry_ops = {
63 .d_iput = configfs_d_iput,
64 .d_delete = always_delete_dentry,
65 };
66
67 #ifdef CONFIG_LOCKDEP
68
69 /*
70 * Helpers to make lockdep happy with our recursive locking of default groups'
71 * inodes (see configfs_attach_group() and configfs_detach_group()).
72 * We put default groups i_mutexes in separate classes according to their depth
73 * from the youngest non-default group ancestor.
74 *
75 * For a non-default group A having default groups A/B, A/C, and A/C/D, default
76 * groups A/B and A/C will have their inode's mutex in class
77 * default_group_class[0], and default group A/C/D will be in
78 * default_group_class[1].
79 *
80 * The lock classes are declared and assigned in inode.c, according to the
81 * s_depth value.
82 * The s_depth value is initialized to -1, adjusted to >= 0 when attaching
83 * default groups, and reset to -1 when all default groups are attached. During
84 * attachment, if configfs_create() sees s_depth > 0, the lock class of the new
85 * inode's mutex is set to default_group_class[s_depth - 1].
86 */
87
88 static void configfs_init_dirent_depth(struct configfs_dirent *sd)
89 {
90 sd->s_depth = -1;
91 }
92
93 static void configfs_set_dir_dirent_depth(struct configfs_dirent *parent_sd,
94 struct configfs_dirent *sd)
95 {
96 int parent_depth = parent_sd->s_depth;
97
98 if (parent_depth >= 0)
99 sd->s_depth = parent_depth + 1;
100 }
101
102 static void
103 configfs_adjust_dir_dirent_depth_before_populate(struct configfs_dirent *sd)
104 {
105 /*
106 * item's i_mutex class is already setup, so s_depth is now only
107 * used to set new sub-directories s_depth, which is always done
108 * with item's i_mutex locked.
109 */
110 /*
111 * sd->s_depth == -1 iff we are a non default group.
112 * else (we are a default group) sd->s_depth > 0 (see
113 * create_dir()).
114 */
115 if (sd->s_depth == -1)
116 /*
117 * We are a non default group and we are going to create
118 * default groups.
119 */
120 sd->s_depth = 0;
121 }
122
123 static void
124 configfs_adjust_dir_dirent_depth_after_populate(struct configfs_dirent *sd)
125 {
126 /* We will not create default groups anymore. */
127 sd->s_depth = -1;
128 }
129
130 #else /* CONFIG_LOCKDEP */
131
/* Without CONFIG_LOCKDEP there is no depth to initialize. */
static void configfs_init_dirent_depth(struct configfs_dirent *sd)
{
	/* nothing to do */
}
135
/* Without CONFIG_LOCKDEP there is no depth to propagate from the parent. */
static void configfs_set_dir_dirent_depth(struct configfs_dirent *parent_sd,
					  struct configfs_dirent *sd)
{
	/* nothing to do */
}
140
/* Without CONFIG_LOCKDEP no depth adjustment is needed before populating. */
static void
configfs_adjust_dir_dirent_depth_before_populate(struct configfs_dirent *sd)
{
	/* nothing to do */
}
145
/* Without CONFIG_LOCKDEP no depth adjustment is needed after populating. */
static void
configfs_adjust_dir_dirent_depth_after_populate(struct configfs_dirent *sd)
{
	/* nothing to do */
}
150
151 #endif /* CONFIG_LOCKDEP */
152
153 static struct configfs_fragment *new_fragment(void)
154 {
155 struct configfs_fragment *p;
156
157 p = kmalloc(sizeof(struct configfs_fragment), GFP_KERNEL);
158 if (p) {
159 atomic_set(&p->frag_count, 1);
160 init_rwsem(&p->frag_sem);
161 p->frag_dead = false;
162 }
163 return p;
164 }
165
166 void put_fragment(struct configfs_fragment *frag)
167 {
168 if (frag && atomic_dec_and_test(&frag->frag_count))
169 kfree(frag);
170 }
171
172 struct configfs_fragment *get_fragment(struct configfs_fragment *frag)
173 {
174 if (likely(frag))
175 atomic_inc(&frag->frag_count);
176 return frag;
177 }
178
179 /*
180 * Allocates a new configfs_dirent and links it to the parent configfs_dirent
181 */
182 static struct configfs_dirent *configfs_new_dirent(struct configfs_dirent *parent_sd,
183 void *element, int type,
184 struct configfs_fragment *frag)
185 {
186 struct configfs_dirent * sd;
187
188 sd = kmem_cache_zalloc(configfs_dir_cachep, GFP_KERNEL);
189 if (!sd)
190 return ERR_PTR(-ENOMEM);
191
192 atomic_set(&sd->s_count, 1);
193 INIT_LIST_HEAD(&sd->s_children);
194 sd->s_element = element;
195 sd->s_type = type;
196 configfs_init_dirent_depth(sd);
197 spin_lock(&configfs_dirent_lock);
198 if (parent_sd->s_type & CONFIGFS_USET_DROPPING) {
199 spin_unlock(&configfs_dirent_lock);
200 kmem_cache_free(configfs_dir_cachep, sd);
201 return ERR_PTR(-ENOENT);
202 }
203 sd->s_frag = get_fragment(frag);
204 list_add(&sd->s_sibling, &parent_sd->s_children);
205 spin_unlock(&configfs_dirent_lock);
206
207 return sd;
208 }
209
210 /*
211 *
212 * Return -EEXIST if there is already a configfs element with the same
213 * name for the same parent.
214 *
215 * called with parent inode's i_mutex held
216 */
217 static int configfs_dirent_exists(struct configfs_dirent *parent_sd,
218 const unsigned char *new)
219 {
220 struct configfs_dirent * sd;
221
222 list_for_each_entry(sd, &parent_sd->s_children, s_sibling) {
223 if (sd->s_element) {
224 const unsigned char *existing = configfs_get_name(sd);
225 if (strcmp(existing, new))
226 continue;
227 else
228 return -EEXIST;
229 }
230 }
231
232 return 0;
233 }
234
235
236 int configfs_make_dirent(struct configfs_dirent * parent_sd,
237 struct dentry * dentry, void * element,
238 umode_t mode, int type, struct configfs_fragment *frag)
239 {
240 struct configfs_dirent * sd;
241
242 sd = configfs_new_dirent(parent_sd, element, type, frag);
243 if (IS_ERR(sd))
244 return PTR_ERR(sd);
245
246 sd->s_mode = mode;
247 sd->s_dentry = dentry;
248 if (dentry)
249 dentry->d_fsdata = configfs_get(sd);
250
251 return 0;
252 }
253
254 static void configfs_remove_dirent(struct dentry *dentry)
255 {
256 struct configfs_dirent *sd = dentry->d_fsdata;
257
258 if (!sd)
259 return;
260 spin_lock(&configfs_dirent_lock);
261 list_del_init(&sd->s_sibling);
262 spin_unlock(&configfs_dirent_lock);
263 configfs_put(sd);
264 }
265
266 /**
267 * configfs_create_dir - create a directory for an config_item.
268 * @item: config_itemwe're creating directory for.
269 * @dentry: config_item's dentry.
270 * @frag: config_item's fragment.
271 *
272 * Note: user-created entries won't be allowed under this new directory
273 * until it is validated by configfs_dir_set_ready()
274 */
275
276 static int configfs_create_dir(struct config_item *item, struct dentry *dentry,
277 struct configfs_fragment *frag)
278 {
279 int error;
280 umode_t mode = S_IFDIR| S_IRWXU | S_IRUGO | S_IXUGO;
281 struct dentry *p = dentry->d_parent;
282 struct inode *inode;
283
284 BUG_ON(!item);
285
286 error = configfs_dirent_exists(p->d_fsdata, dentry->d_name.name);
287 if (unlikely(error))
288 return error;
289
290 error = configfs_make_dirent(p->d_fsdata, dentry, item, mode,
291 CONFIGFS_DIR | CONFIGFS_USET_CREATING,
292 frag);
293 if (unlikely(error))
294 return error;
295
296 configfs_set_dir_dirent_depth(p->d_fsdata, dentry->d_fsdata);
297 inode = configfs_create(dentry, mode);
298 if (IS_ERR(inode))
299 goto out_remove;
300
301 inode->i_op = &configfs_dir_inode_operations;
302 inode->i_fop = &configfs_dir_operations;
303 /* directory inodes start off with i_nlink == 2 (for "." entry) */
304 inc_nlink(inode);
305 d_instantiate(dentry, inode);
306 /* already hashed */
307 dget(dentry); /* pin directory dentries in core */
308 inc_nlink(d_inode(p));
309 item->ci_dentry = dentry;
310 return 0;
311
312 out_remove:
313 configfs_remove_dirent(dentry);
314 return PTR_ERR(inode);
315 }
316
317 /*
318 * Allow userspace to create new entries under a new directory created with
319 * configfs_create_dir(), and under all of its chidlren directories recursively.
320 * @sd configfs_dirent of the new directory to validate
321 *
322 * Caller must hold configfs_dirent_lock.
323 */
324 static void configfs_dir_set_ready(struct configfs_dirent *sd)
325 {
326 struct configfs_dirent *child_sd;
327
328 sd->s_type &= ~CONFIGFS_USET_CREATING;
329 list_for_each_entry(child_sd, &sd->s_children, s_sibling)
330 if (child_sd->s_type & CONFIGFS_USET_CREATING)
331 configfs_dir_set_ready(child_sd);
332 }
333
334 /*
335 * Check that a directory does not belong to a directory hierarchy being
336 * attached and not validated yet.
337 * @sd configfs_dirent of the directory to check
338 *
339 * @return non-zero iff the directory was validated
340 *
341 * Note: takes configfs_dirent_lock, so the result may change from false to true
342 * in two consecutive calls, but never from true to false.
343 */
344 int configfs_dirent_is_ready(struct configfs_dirent *sd)
345 {
346 int ret;
347
348 spin_lock(&configfs_dirent_lock);
349 ret = !(sd->s_type & CONFIGFS_USET_CREATING);
350 spin_unlock(&configfs_dirent_lock);
351
352 return ret;
353 }
354
355 int configfs_create_link(struct configfs_dirent *target, struct dentry *parent,
356 struct dentry *dentry, char *body)
357 {
358 int err = 0;
359 umode_t mode = S_IFLNK | S_IRWXUGO;
360 struct configfs_dirent *p = parent->d_fsdata;
361 struct inode *inode;
362
363 err = configfs_make_dirent(p, dentry, target, mode, CONFIGFS_ITEM_LINK,
364 p->s_frag);
365 if (err)
366 return err;
367
368 inode = configfs_create(dentry, mode);
369 if (IS_ERR(inode))
370 goto out_remove;
371
372 inode->i_link = body;
373 inode->i_op = &configfs_symlink_inode_operations;
374 d_instantiate(dentry, inode);
375 dget(dentry); /* pin link dentries in core */
376 return 0;
377
378 out_remove:
379 configfs_remove_dirent(dentry);
380 return PTR_ERR(inode);
381 }
382
383 static void remove_dir(struct dentry * d)
384 {
385 struct dentry * parent = dget(d->d_parent);
386
387 configfs_remove_dirent(d);
388
389 if (d_really_is_positive(d))
390 simple_rmdir(d_inode(parent),d);
391
392 pr_debug(" o %pd removing done (%d)\n", d, d_count(d));
393
394 dput(parent);
395 }
396
397 /**
398 * configfs_remove_dir - remove an config_item's directory.
399 * @item: config_item we're removing.
400 *
401 * The only thing special about this is that we remove any files in
402 * the directory before we remove the directory, and we've inlined
403 * what used to be configfs_rmdir() below, instead of calling separately.
404 *
405 * Caller holds the mutex of the item's inode
406 */
407
408 static void configfs_remove_dir(struct config_item * item)
409 {
410 struct dentry * dentry = dget(item->ci_dentry);
411
412 if (!dentry)
413 return;
414
415 remove_dir(dentry);
416 /**
417 * Drop reference from dget() on entrance.
418 */
419 dput(dentry);
420 }
421
422
423 /* attaches attribute's configfs_dirent to the dentry corresponding to the
424 * attribute file
425 */
426 static int configfs_attach_attr(struct configfs_dirent * sd, struct dentry * dentry)
427 {
428 struct configfs_attribute * attr = sd->s_element;
429 struct inode *inode;
430
431 spin_lock(&configfs_dirent_lock);
432 dentry->d_fsdata = configfs_get(sd);
433 sd->s_dentry = dentry;
434 spin_unlock(&configfs_dirent_lock);
435
436 inode = configfs_create(dentry, (attr->ca_mode & S_IALLUGO) | S_IFREG);
437 if (IS_ERR(inode)) {
438 configfs_put(sd);
439 return PTR_ERR(inode);
440 }
441 if (sd->s_type & CONFIGFS_ITEM_BIN_ATTR) {
442 inode->i_size = 0;
443 inode->i_fop = &configfs_bin_file_operations;
444 } else {
445 inode->i_size = PAGE_SIZE;
446 inode->i_fop = &configfs_file_operations;
447 }
448 d_add(dentry, inode);
449 return 0;
450 }
451
452 static struct dentry * configfs_lookup(struct inode *dir,
453 struct dentry *dentry,
454 unsigned int flags)
455 {
456 struct configfs_dirent * parent_sd = dentry->d_parent->d_fsdata;
457 struct configfs_dirent * sd;
458 int found = 0;
459 int err;
460
461 /*
462 * Fake invisibility if dir belongs to a group/default groups hierarchy
463 * being attached
464 *
465 * This forbids userspace to read/write attributes of items which may
466 * not complete their initialization, since the dentries of the
467 * attributes won't be instantiated.
468 */
469 err = -ENOENT;
470 if (!configfs_dirent_is_ready(parent_sd))
471 goto out;
472
473 list_for_each_entry(sd, &parent_sd->s_children, s_sibling) {
474 if (sd->s_type & CONFIGFS_NOT_PINNED) {
475 const unsigned char * name = configfs_get_name(sd);
476
477 if (strcmp(name, dentry->d_name.name))
478 continue;
479
480 found = 1;
481 err = configfs_attach_attr(sd, dentry);
482 break;
483 }
484 }
485
486 if (!found) {
487 /*
488 * If it doesn't exist and it isn't a NOT_PINNED item,
489 * it must be negative.
490 */
491 if (dentry->d_name.len > NAME_MAX)
492 return ERR_PTR(-ENAMETOOLONG);
493 d_add(dentry, NULL);
494 return NULL;
495 }
496
497 out:
498 return ERR_PTR(err);
499 }
500
501 /*
502 * Only subdirectories count here. Files (CONFIGFS_NOT_PINNED) are
503 * attributes and are removed by rmdir(). We recurse, setting
504 * CONFIGFS_USET_DROPPING on all children that are candidates for
505 * default detach.
506 * If there is an error, the caller will reset the flags via
507 * configfs_detach_rollback().
508 */
509 static int configfs_detach_prep(struct dentry *dentry, struct dentry **wait)
510 {
511 struct configfs_dirent *parent_sd = dentry->d_fsdata;
512 struct configfs_dirent *sd;
513 int ret;
514
515 /* Mark that we're trying to drop the group */
516 parent_sd->s_type |= CONFIGFS_USET_DROPPING;
517
518 ret = -EBUSY;
519 if (parent_sd->s_links)
520 goto out;
521
522 ret = 0;
523 list_for_each_entry(sd, &parent_sd->s_children, s_sibling) {
524 if (!sd->s_element ||
525 (sd->s_type & CONFIGFS_NOT_PINNED))
526 continue;
527 if (sd->s_type & CONFIGFS_USET_DEFAULT) {
528 /* Abort if racing with mkdir() */
529 if (sd->s_type & CONFIGFS_USET_IN_MKDIR) {
530 if (wait)
531 *wait= dget(sd->s_dentry);
532 return -EAGAIN;
533 }
534
535 /*
536 * Yup, recursive. If there's a problem, blame
537 * deep nesting of default_groups
538 */
539 ret = configfs_detach_prep(sd->s_dentry, wait);
540 if (!ret)
541 continue;
542 } else
543 ret = -ENOTEMPTY;
544
545 break;
546 }
547
548 out:
549 return ret;
550 }
551
552 /*
553 * Walk the tree, resetting CONFIGFS_USET_DROPPING wherever it was
554 * set.
555 */
556 static void configfs_detach_rollback(struct dentry *dentry)
557 {
558 struct configfs_dirent *parent_sd = dentry->d_fsdata;
559 struct configfs_dirent *sd;
560
561 parent_sd->s_type &= ~CONFIGFS_USET_DROPPING;
562
563 list_for_each_entry(sd, &parent_sd->s_children, s_sibling)
564 if (sd->s_type & CONFIGFS_USET_DEFAULT)
565 configfs_detach_rollback(sd->s_dentry);
566 }
567
568 static void detach_attrs(struct config_item * item)
569 {
570 struct dentry * dentry = dget(item->ci_dentry);
571 struct configfs_dirent * parent_sd;
572 struct configfs_dirent * sd, * tmp;
573
574 if (!dentry)
575 return;
576
577 pr_debug("configfs %s: dropping attrs for dir\n",
578 dentry->d_name.name);
579
580 parent_sd = dentry->d_fsdata;
581 list_for_each_entry_safe(sd, tmp, &parent_sd->s_children, s_sibling) {
582 if (!sd->s_element || !(sd->s_type & CONFIGFS_NOT_PINNED))
583 continue;
584 spin_lock(&configfs_dirent_lock);
585 list_del_init(&sd->s_sibling);
586 spin_unlock(&configfs_dirent_lock);
587 configfs_drop_dentry(sd, dentry);
588 configfs_put(sd);
589 }
590
591 /**
592 * Drop reference from dget() on entrance.
593 */
594 dput(dentry);
595 }
596
597 static int populate_attrs(struct config_item *item)
598 {
599 const struct config_item_type *t = item->ci_type;
600 struct configfs_attribute *attr;
601 struct configfs_bin_attribute *bin_attr;
602 int error = 0;
603 int i;
604
605 if (!t)
606 return -EINVAL;
607 if (t->ct_attrs) {
608 for (i = 0; (attr = t->ct_attrs[i]) != NULL; i++) {
609 if ((error = configfs_create_file(item, attr)))
610 break;
611 }
612 }
613 if (t->ct_bin_attrs) {
614 for (i = 0; (bin_attr = t->ct_bin_attrs[i]) != NULL; i++) {
615 error = configfs_create_bin_file(item, bin_attr);
616 if (error)
617 break;
618 }
619 }
620
621 if (error)
622 detach_attrs(item);
623
624 return error;
625 }
626
/*
 * Forward declarations: these are used by detach_groups() and
 * create_default_group() before their definitions further down.
 */
static int configfs_attach_group(struct config_item *parent_item,
				 struct config_item *item,
				 struct dentry *dentry,
				 struct configfs_fragment *frag);

static void configfs_detach_group(struct config_item *item);
632
633 static void detach_groups(struct config_group *group)
634 {
635 struct dentry * dentry = dget(group->cg_item.ci_dentry);
636 struct dentry *child;
637 struct configfs_dirent *parent_sd;
638 struct configfs_dirent *sd, *tmp;
639
640 if (!dentry)
641 return;
642
643 parent_sd = dentry->d_fsdata;
644 list_for_each_entry_safe(sd, tmp, &parent_sd->s_children, s_sibling) {
645 if (!sd->s_element ||
646 !(sd->s_type & CONFIGFS_USET_DEFAULT))
647 continue;
648
649 child = sd->s_dentry;
650
651 inode_lock(d_inode(child));
652
653 configfs_detach_group(sd->s_element);
654 d_inode(child)->i_flags |= S_DEAD;
655 dont_mount(child);
656
657 inode_unlock(d_inode(child));
658
659 d_delete(child);
660 dput(child);
661 }
662
663 /**
664 * Drop reference from dget() on entrance.
665 */
666 dput(dentry);
667 }
668
669 /*
670 * This fakes mkdir(2) on a default_groups[] entry. It
671 * creates a dentry, attachs it, and then does fixup
672 * on the sd->s_type.
673 *
674 * We could, perhaps, tweak our parent's ->mkdir for a minute and
675 * try using vfs_mkdir. Just a thought.
676 */
677 static int create_default_group(struct config_group *parent_group,
678 struct config_group *group,
679 struct configfs_fragment *frag)
680 {
681 int ret;
682 struct configfs_dirent *sd;
683 /* We trust the caller holds a reference to parent */
684 struct dentry *child, *parent = parent_group->cg_item.ci_dentry;
685
686 if (!group->cg_item.ci_name)
687 group->cg_item.ci_name = group->cg_item.ci_namebuf;
688
689 ret = -ENOMEM;
690 child = d_alloc_name(parent, group->cg_item.ci_name);
691 if (child) {
692 d_add(child, NULL);
693
694 ret = configfs_attach_group(&parent_group->cg_item,
695 &group->cg_item, child, frag);
696 if (!ret) {
697 sd = child->d_fsdata;
698 sd->s_type |= CONFIGFS_USET_DEFAULT;
699 } else {
700 BUG_ON(d_inode(child));
701 d_drop(child);
702 dput(child);
703 }
704 }
705
706 return ret;
707 }
708
709 static int populate_groups(struct config_group *group,
710 struct configfs_fragment *frag)
711 {
712 struct config_group *new_group;
713 int ret = 0;
714
715 list_for_each_entry(new_group, &group->default_groups, group_entry) {
716 ret = create_default_group(group, new_group, frag);
717 if (ret) {
718 detach_groups(group);
719 break;
720 }
721 }
722
723 return ret;
724 }
725
726 void configfs_remove_default_groups(struct config_group *group)
727 {
728 struct config_group *g, *n;
729
730 list_for_each_entry_safe(g, n, &group->default_groups, group_entry) {
731 list_del(&g->group_entry);
732 config_item_put(&g->cg_item);
733 }
734 }
735 EXPORT_SYMBOL(configfs_remove_default_groups);
736
737 /*
738 * All of link_obj/unlink_obj/link_group/unlink_group require that
739 * subsys->su_mutex is held.
740 */
741
742 static void unlink_obj(struct config_item *item)
743 {
744 struct config_group *group;
745
746 group = item->ci_group;
747 if (group) {
748 list_del_init(&item->ci_entry);
749
750 item->ci_group = NULL;
751 item->ci_parent = NULL;
752
753 /* Drop the reference for ci_entry */
754 config_item_put(item);
755
756 /* Drop the reference for ci_parent */
757 config_group_put(group);
758 }
759 }
760
761 static void link_obj(struct config_item *parent_item, struct config_item *item)
762 {
763 /*
764 * Parent seems redundant with group, but it makes certain
765 * traversals much nicer.
766 */
767 item->ci_parent = parent_item;
768
769 /*
770 * We hold a reference on the parent for the child's ci_parent
771 * link.
772 */
773 item->ci_group = config_group_get(to_config_group(parent_item));
774 list_add_tail(&item->ci_entry, &item->ci_group->cg_children);
775
776 /*
777 * We hold a reference on the child for ci_entry on the parent's
778 * cg_children
779 */
780 config_item_get(item);
781 }
782
783 static void unlink_group(struct config_group *group)
784 {
785 struct config_group *new_group;
786
787 list_for_each_entry(new_group, &group->default_groups, group_entry)
788 unlink_group(new_group);
789
790 group->cg_subsys = NULL;
791 unlink_obj(&group->cg_item);
792 }
793
794 static void link_group(struct config_group *parent_group, struct config_group *group)
795 {
796 struct config_group *new_group;
797 struct configfs_subsystem *subsys = NULL; /* gcc is a turd */
798
799 link_obj(&parent_group->cg_item, &group->cg_item);
800
801 if (parent_group->cg_subsys)
802 subsys = parent_group->cg_subsys;
803 else if (configfs_is_root(&parent_group->cg_item))
804 subsys = to_configfs_subsystem(group);
805 else
806 BUG();
807 group->cg_subsys = subsys;
808
809 list_for_each_entry(new_group, &group->default_groups, group_entry)
810 link_group(group, new_group);
811 }
812
813 /*
814 * The goal is that configfs_attach_item() (and
815 * configfs_attach_group()) can be called from either the VFS or this
816 * module. That is, they assume that the items have been created,
817 * the dentry allocated, and the dcache is all ready to go.
818 *
819 * If they fail, they must clean up after themselves as if they
820 * had never been called. The caller (VFS or local function) will
821 * handle cleaning up the dcache bits.
822 *
823 * configfs_detach_group() and configfs_detach_item() behave similarly on
824 * the way out. They assume that the proper semaphores are held, they
825 * clean up the configfs items, and they expect their callers will
826 * handle the dcache bits.
827 */
828 static int configfs_attach_item(struct config_item *parent_item,
829 struct config_item *item,
830 struct dentry *dentry,
831 struct configfs_fragment *frag)
832 {
833 int ret;
834
835 ret = configfs_create_dir(item, dentry, frag);
836 if (!ret) {
837 ret = populate_attrs(item);
838 if (ret) {
839 /*
840 * We are going to remove an inode and its dentry but
841 * the VFS may already have hit and used them. Thus,
842 * we must lock them as rmdir() would.
843 */
844 inode_lock(d_inode(dentry));
845 configfs_remove_dir(item);
846 d_inode(dentry)->i_flags |= S_DEAD;
847 dont_mount(dentry);
848 inode_unlock(d_inode(dentry));
849 d_delete(dentry);
850 }
851 }
852
853 return ret;
854 }
855
/*
 * Tear down @item's attributes, then its directory.
 *
 * Caller holds the mutex of the item's inode.
 */
static void configfs_detach_item(struct config_item *item)
{
	detach_attrs(item);

	configfs_remove_dir(item);
}
862
863 static int configfs_attach_group(struct config_item *parent_item,
864 struct config_item *item,
865 struct dentry *dentry,
866 struct configfs_fragment *frag)
867 {
868 int ret;
869 struct configfs_dirent *sd;
870
871 ret = configfs_attach_item(parent_item, item, dentry, frag);
872 if (!ret) {
873 sd = dentry->d_fsdata;
874 sd->s_type |= CONFIGFS_USET_DIR;
875
876 /*
877 * FYI, we're faking mkdir in populate_groups()
878 * We must lock the group's inode to avoid races with the VFS
879 * which can already hit the inode and try to add/remove entries
880 * under it.
881 *
882 * We must also lock the inode to remove it safely in case of
883 * error, as rmdir() would.
884 */
885 inode_lock_nested(d_inode(dentry), I_MUTEX_CHILD);
886 configfs_adjust_dir_dirent_depth_before_populate(sd);
887 ret = populate_groups(to_config_group(item), frag);
888 if (ret) {
889 configfs_detach_item(item);
890 d_inode(dentry)->i_flags |= S_DEAD;
891 dont_mount(dentry);
892 }
893 configfs_adjust_dir_dirent_depth_after_populate(sd);
894 inode_unlock(d_inode(dentry));
895 if (ret)
896 d_delete(dentry);
897 }
898
899 return ret;
900 }
901
/*
 * Detach the group's default groups, then the group item itself.
 *
 * Caller holds the mutex of the group's inode.
 */
static void configfs_detach_group(struct config_item *item)
{
	detach_groups(to_config_group(item));

	configfs_detach_item(item);
}
908
909 /*
910 * After the item has been detached from the filesystem view, we are
911 * ready to tear it out of the hierarchy. Notify the client before
912 * we do that so they can perform any cleanup that requires
913 * navigating the hierarchy. A client does not need to provide this
914 * callback. The subsystem semaphore MUST be held by the caller, and
915 * references must be valid for both items. It also assumes the
916 * caller has validated ci_type.
917 */
918 static void client_disconnect_notify(struct config_item *parent_item,
919 struct config_item *item)
920 {
921 const struct config_item_type *type;
922
923 type = parent_item->ci_type;
924 BUG_ON(!type);
925
926 if (type->ct_group_ops && type->ct_group_ops->disconnect_notify)
927 type->ct_group_ops->disconnect_notify(to_config_group(parent_item),
928 item);
929 }
930
931 /*
932 * Drop the initial reference from make_item()/make_group()
933 * This function assumes that reference is held on item
934 * and that item holds a valid reference to the parent. Also, it
935 * assumes the caller has validated ci_type.
936 */
937 static void client_drop_item(struct config_item *parent_item,
938 struct config_item *item)
939 {
940 const struct config_item_type *type;
941
942 type = parent_item->ci_type;
943 BUG_ON(!type);
944
945 /*
946 * If ->drop_item() exists, it is responsible for the
947 * config_item_put().
948 */
949 if (type->ct_group_ops && type->ct_group_ops->drop_item)
950 type->ct_group_ops->drop_item(to_config_group(parent_item),
951 item);
952 else
953 config_item_put(item);
954 }
955
956 #ifdef DEBUG
957 static void configfs_dump_one(struct configfs_dirent *sd, int level)
958 {
959 pr_info("%*s\"%s\":\n", level, " ", configfs_get_name(sd));
960
961 #define type_print(_type) if (sd->s_type & _type) pr_info("%*s %s\n", level, " ", #_type);
962 type_print(CONFIGFS_ROOT);
963 type_print(CONFIGFS_DIR);
964 type_print(CONFIGFS_ITEM_ATTR);
965 type_print(CONFIGFS_ITEM_LINK);
966 type_print(CONFIGFS_USET_DIR);
967 type_print(CONFIGFS_USET_DEFAULT);
968 type_print(CONFIGFS_USET_DROPPING);
969 #undef type_print
970 }
971
972 static int configfs_dump(struct configfs_dirent *sd, int level)
973 {
974 struct configfs_dirent *child_sd;
975 int ret = 0;
976
977 configfs_dump_one(sd, level);
978
979 if (!(sd->s_type & (CONFIGFS_DIR|CONFIGFS_ROOT)))
980 return 0;
981
982 list_for_each_entry(child_sd, &sd->s_children, s_sibling) {
983 ret = configfs_dump(child_sd, level + 2);
984 if (ret)
985 break;
986 }
987
988 return ret;
989 }
990 #endif
991
992
993 /*
994 * configfs_depend_item() and configfs_undepend_item()
995 *
996 * WARNING: Do not call these from a configfs callback!
997 *
998 * This describes these functions and their helpers.
999 *
1000 * Allow another kernel system to depend on a config_item. If this
1001 * happens, the item cannot go away until the dependent can live without
1002 * it. The idea is to give client modules as simple an interface as
1003 * possible. When a system asks them to depend on an item, they just
1004 * call configfs_depend_item(). If the item is live and the client
1005 * driver is in good shape, we'll happily do the work for them.
1006 *
1007 * Why is the locking complex? Because configfs uses the VFS to handle
1008 * all locking, but this function is called outside the normal
1009 * VFS->configfs path. So it must take VFS locks to prevent the
1010 * VFS->configfs stuff (configfs_mkdir(), configfs_rmdir(), etc). This is
1011 * why you can't call these functions underneath configfs callbacks.
1012 *
1013 * Note, btw, that this can be called at *any* time, even when a configfs
1014 * subsystem isn't registered, or when configfs is loading or unloading.
1015 * Just like configfs_register_subsystem(). So we take the same
1016 * precautions. We pin the filesystem. We lock configfs_dirent_lock.
1017 * If we can find the target item in the
1018 * configfs tree, it must be part of the subsystem tree as well, so we
1019 * do not need the subsystem semaphore. Holding configfs_dirent_lock helps
1020 * locking out mkdir() and rmdir(), who might be racing us.
1021 */
1022
1023 /*
1024 * configfs_depend_prep()
1025 *
1026 * Only subdirectories count here. Files (CONFIGFS_NOT_PINNED) are
1027 * attributes. This is similar but not the same to configfs_detach_prep().
1028 * Note that configfs_detach_prep() expects the parent to be locked when it
1029 * is called, but we lock the parent *inside* configfs_depend_prep(). We
1030 * do that so we can unlock it if we find nothing.
1031 *
1032 * Here we do a depth-first search of the dentry hierarchy looking for
1033 * our object.
1034 * We deliberately ignore items tagged as dropping since they are virtually
1035 * dead, as well as items in the middle of attachment since they virtually
1036 * do not exist yet. This completes the locking out of racing mkdir() and
1037 * rmdir().
1038 * Note: subdirectories in the middle of attachment start with s_type =
1039 * CONFIGFS_DIR|CONFIGFS_USET_CREATING set by create_dir(). When
1040 * CONFIGFS_USET_CREATING is set, we ignore the item. The actual set of
1041 * s_type is in configfs_new_dirent(), which has configfs_dirent_lock.
1042 *
1043 * If the target is not found, -ENOENT is bubbled up.
1044 *
1045 * This adds a requirement that all config_items be unique!
1046 *
1047 * This is recursive. There isn't
1048 * much on the stack, though, so folks that need this function - be careful
1049 * about your stack! Patches will be accepted to make it iterative.
1050 */
1051 static int configfs_depend_prep(struct dentry *origin,
1052 struct config_item *target)
1053 {
1054 struct configfs_dirent *child_sd, *sd;
1055 int ret = 0;
1056
1057 BUG_ON(!origin || !origin->d_fsdata);
1058 sd = origin->d_fsdata;
1059
1060 if (sd->s_element == target) /* Boo-yah */
1061 goto out;
1062
1063 list_for_each_entry(child_sd, &sd->s_children, s_sibling) {
1064 if ((child_sd->s_type & CONFIGFS_DIR) &&
1065 !(child_sd->s_type & CONFIGFS_USET_DROPPING) &&
1066 !(child_sd->s_type & CONFIGFS_USET_CREATING)) {
1067 ret = configfs_depend_prep(child_sd->s_dentry,
1068 target);
1069 if (!ret)
1070 goto out; /* Child path boo-yah */
1071 }
1072 }
1073
1074 /* We looped all our children and didn't find target */
1075 ret = -ENOENT;
1076
1077 out:
1078 return ret;
1079 }
1080
1081 static int configfs_do_depend_item(struct dentry *subsys_dentry,
1082 struct config_item *target)
1083 {
1084 struct configfs_dirent *p;
1085 int ret;
1086
1087 spin_lock(&configfs_dirent_lock);
1088 /* Scan the tree, return 0 if found */
1089 ret = configfs_depend_prep(subsys_dentry, target);
1090 if (ret)
1091 goto out_unlock_dirent_lock;
1092
1093 /*
1094 * We are sure that the item is not about to be removed by rmdir(), and
1095 * not in the middle of attachment by mkdir().
1096 */
1097 p = target->ci_dentry->d_fsdata;
1098 p->s_dependent_count += 1;
1099
1100 out_unlock_dirent_lock:
1101 spin_unlock(&configfs_dirent_lock);
1102
1103 return ret;
1104 }
1105
1106 static inline struct configfs_dirent *
1107 configfs_find_subsys_dentry(struct configfs_dirent *root_sd,
1108 struct config_item *subsys_item)
1109 {
1110 struct configfs_dirent *p;
1111 struct configfs_dirent *ret = NULL;
1112
1113 list_for_each_entry(p, &root_sd->s_children, s_sibling) {
1114 if (p->s_type & CONFIGFS_DIR &&
1115 p->s_element == subsys_item) {
1116 ret = p;
1117 break;
1118 }
1119 }
1120
1121 return ret;
1122 }
1123
1124
1125 int configfs_depend_item(struct configfs_subsystem *subsys,
1126 struct config_item *target)
1127 {
1128 int ret;
1129 struct configfs_dirent *subsys_sd;
1130 struct config_item *s_item = &subsys->su_group.cg_item;
1131 struct dentry *root;
1132
1133 /*
1134 * Pin the configfs filesystem. This means we can safely access
1135 * the root of the configfs filesystem.
1136 */
1137 root = configfs_pin_fs();
1138 if (IS_ERR(root))
1139 return PTR_ERR(root);
1140
1141 /*
1142 * Next, lock the root directory. We're going to check that the
1143 * subsystem is really registered, and so we need to lock out
1144 * configfs_[un]register_subsystem().
1145 */
1146 inode_lock(d_inode(root));
1147
1148 subsys_sd = configfs_find_subsys_dentry(root->d_fsdata, s_item);
1149 if (!subsys_sd) {
1150 ret = -ENOENT;
1151 goto out_unlock_fs;
1152 }
1153
1154 /* Ok, now we can trust subsys/s_item */
1155 ret = configfs_do_depend_item(subsys_sd->s_dentry, target);
1156
1157 out_unlock_fs:
1158 inode_unlock(d_inode(root));
1159
1160 /*
1161 * If we succeeded, the fs is pinned via other methods. If not,
1162 * we're done with it anyway. So release_fs() is always right.
1163 */
1164 configfs_release_fs();
1165
1166 return ret;
1167 }
1168 EXPORT_SYMBOL(configfs_depend_item);
1169
1170 /*
1171 * Release the dependent linkage. This is much simpler than
1172 * configfs_depend_item() because we know that the client driver is
1173 * pinned, thus the subsystem is pinned, and therefore configfs is pinned.
1174 */
1175 void configfs_undepend_item(struct config_item *target)
1176 {
1177 struct configfs_dirent *sd;
1178
1179 /*
1180 * Since we can trust everything is pinned, we just need
1181 * configfs_dirent_lock.
1182 */
1183 spin_lock(&configfs_dirent_lock);
1184
1185 sd = target->ci_dentry->d_fsdata;
1186 BUG_ON(sd->s_dependent_count < 1);
1187
1188 sd->s_dependent_count -= 1;
1189
1190 /*
1191 * After this unlock, we cannot trust the item to stay alive!
1192 * DO NOT REFERENCE item after this unlock.
1193 */
1194 spin_unlock(&configfs_dirent_lock);
1195 }
1196 EXPORT_SYMBOL(configfs_undepend_item);
1197
1198 /*
1199 * caller_subsys is a caller's subsystem not target's. This is used to
1200 * determine if we should lock root and check subsys or not. When we are
1201 * in the same subsystem as our target there is no need to do locking as
1202 * we know that subsys is valid and is not unregistered during this function
1203 * as we are called from callback of one of his children and VFS holds a lock
1204 * on some inode. Otherwise we have to lock our root to ensure that target's
1205 * subsystem it is not unregistered during this function.
1206 */
1207 int configfs_depend_item_unlocked(struct configfs_subsystem *caller_subsys,
1208 struct config_item *target)
1209 {
1210 struct configfs_subsystem *target_subsys;
1211 struct config_group *root, *parent;
1212 struct configfs_dirent *subsys_sd;
1213 int ret = -ENOENT;
1214
1215 /* Disallow this function for configfs root */
1216 if (configfs_is_root(target))
1217 return -EINVAL;
1218
1219 parent = target->ci_group;
1220 /*
1221 * This may happen when someone is trying to depend root
1222 * directory of some subsystem
1223 */
1224 if (configfs_is_root(&parent->cg_item)) {
1225 target_subsys = to_configfs_subsystem(to_config_group(target));
1226 root = parent;
1227 } else {
1228 target_subsys = parent->cg_subsys;
1229 /* Find a cofnigfs root as we may need it for locking */
1230 for (root = parent; !configfs_is_root(&root->cg_item);
1231 root = root->cg_item.ci_group)
1232 ;
1233 }
1234
1235 if (target_subsys != caller_subsys) {
1236 /*
1237 * We are in other configfs subsystem, so we have to do
1238 * additional locking to prevent other subsystem from being
1239 * unregistered
1240 */
1241 inode_lock(d_inode(root->cg_item.ci_dentry));
1242
1243 /*
1244 * As we are trying to depend item from other subsystem
1245 * we have to check if this subsystem is still registered
1246 */
1247 subsys_sd = configfs_find_subsys_dentry(
1248 root->cg_item.ci_dentry->d_fsdata,
1249 &target_subsys->su_group.cg_item);
1250 if (!subsys_sd)
1251 goto out_root_unlock;
1252 } else {
1253 subsys_sd = target_subsys->su_group.cg_item.ci_dentry->d_fsdata;
1254 }
1255
1256 /* Now we can execute core of depend item */
1257 ret = configfs_do_depend_item(subsys_sd->s_dentry, target);
1258
1259 if (target_subsys != caller_subsys)
1260 out_root_unlock:
1261 /*
1262 * We were called from subsystem other than our target so we
1263 * took some locks so now it's time to release them
1264 */
1265 inode_unlock(d_inode(root->cg_item.ci_dentry));
1266
1267 return ret;
1268 }
1269 EXPORT_SYMBOL(configfs_depend_item_unlocked);
1270
1271 static int configfs_mkdir(struct user_namespace *mnt_userns, struct inode *dir,
1272 struct dentry *dentry, umode_t mode)
1273 {
1274 int ret = 0;
1275 int module_got = 0;
1276 struct config_group *group = NULL;
1277 struct config_item *item = NULL;
1278 struct config_item *parent_item;
1279 struct configfs_subsystem *subsys;
1280 struct configfs_dirent *sd;
1281 const struct config_item_type *type;
1282 struct module *subsys_owner = NULL, *new_item_owner = NULL;
1283 struct configfs_fragment *frag;
1284 char *name;
1285
1286 sd = dentry->d_parent->d_fsdata;
1287
1288 /*
1289 * Fake invisibility if dir belongs to a group/default groups hierarchy
1290 * being attached
1291 */
1292 if (!configfs_dirent_is_ready(sd)) {
1293 ret = -ENOENT;
1294 goto out;
1295 }
1296
1297 if (!(sd->s_type & CONFIGFS_USET_DIR)) {
1298 ret = -EPERM;
1299 goto out;
1300 }
1301
1302 frag = new_fragment();
1303 if (!frag) {
1304 ret = -ENOMEM;
1305 goto out;
1306 }
1307
1308 /* Get a working ref for the duration of this function */
1309 parent_item = configfs_get_config_item(dentry->d_parent);
1310 type = parent_item->ci_type;
1311 subsys = to_config_group(parent_item)->cg_subsys;
1312 BUG_ON(!subsys);
1313
1314 if (!type || !type->ct_group_ops ||
1315 (!type->ct_group_ops->make_group &&
1316 !type->ct_group_ops->make_item)) {
1317 ret = -EPERM; /* Lack-of-mkdir returns -EPERM */
1318 goto out_put;
1319 }
1320
1321 /*
1322 * The subsystem may belong to a different module than the item
1323 * being created. We don't want to safely pin the new item but
1324 * fail to pin the subsystem it sits under.
1325 */
1326 if (!subsys->su_group.cg_item.ci_type) {
1327 ret = -EINVAL;
1328 goto out_put;
1329 }
1330 subsys_owner = subsys->su_group.cg_item.ci_type->ct_owner;
1331 if (!try_module_get(subsys_owner)) {
1332 ret = -EINVAL;
1333 goto out_put;
1334 }
1335
1336 name = kmalloc(dentry->d_name.len + 1, GFP_KERNEL);
1337 if (!name) {
1338 ret = -ENOMEM;
1339 goto out_subsys_put;
1340 }
1341
1342 snprintf(name, dentry->d_name.len + 1, "%s", dentry->d_name.name);
1343
1344 mutex_lock(&subsys->su_mutex);
1345 if (type->ct_group_ops->make_group) {
1346 group = type->ct_group_ops->make_group(to_config_group(parent_item), name);
1347 if (!group)
1348 group = ERR_PTR(-ENOMEM);
1349 if (!IS_ERR(group)) {
1350 link_group(to_config_group(parent_item), group);
1351 item = &group->cg_item;
1352 } else
1353 ret = PTR_ERR(group);
1354 } else {
1355 item = type->ct_group_ops->make_item(to_config_group(parent_item), name);
1356 if (!item)
1357 item = ERR_PTR(-ENOMEM);
1358 if (!IS_ERR(item))
1359 link_obj(parent_item, item);
1360 else
1361 ret = PTR_ERR(item);
1362 }
1363 mutex_unlock(&subsys->su_mutex);
1364
1365 kfree(name);
1366 if (ret) {
1367 /*
1368 * If ret != 0, then link_obj() was never called.
1369 * There are no extra references to clean up.
1370 */
1371 goto out_subsys_put;
1372 }
1373
1374 /*
1375 * link_obj() has been called (via link_group() for groups).
1376 * From here on out, errors must clean that up.
1377 */
1378
1379 type = item->ci_type;
1380 if (!type) {
1381 ret = -EINVAL;
1382 goto out_unlink;
1383 }
1384
1385 new_item_owner = type->ct_owner;
1386 if (!try_module_get(new_item_owner)) {
1387 ret = -EINVAL;
1388 goto out_unlink;
1389 }
1390
1391 /*
1392 * I hate doing it this way, but if there is
1393 * an error, module_put() probably should
1394 * happen after any cleanup.
1395 */
1396 module_got = 1;
1397
1398 /*
1399 * Make racing rmdir() fail if it did not tag parent with
1400 * CONFIGFS_USET_DROPPING
1401 * Note: if CONFIGFS_USET_DROPPING is already set, attach_group() will
1402 * fail and let rmdir() terminate correctly
1403 */
1404 spin_lock(&configfs_dirent_lock);
1405 /* This will make configfs_detach_prep() fail */
1406 sd->s_type |= CONFIGFS_USET_IN_MKDIR;
1407 spin_unlock(&configfs_dirent_lock);
1408
1409 if (group)
1410 ret = configfs_attach_group(parent_item, item, dentry, frag);
1411 else
1412 ret = configfs_attach_item(parent_item, item, dentry, frag);
1413
1414 spin_lock(&configfs_dirent_lock);
1415 sd->s_type &= ~CONFIGFS_USET_IN_MKDIR;
1416 if (!ret)
1417 configfs_dir_set_ready(dentry->d_fsdata);
1418 spin_unlock(&configfs_dirent_lock);
1419
1420 out_unlink:
1421 if (ret) {
1422 /* Tear down everything we built up */
1423 mutex_lock(&subsys->su_mutex);
1424
1425 client_disconnect_notify(parent_item, item);
1426 if (group)
1427 unlink_group(group);
1428 else
1429 unlink_obj(item);
1430 client_drop_item(parent_item, item);
1431
1432 mutex_unlock(&subsys->su_mutex);
1433
1434 if (module_got)
1435 module_put(new_item_owner);
1436 }
1437
1438 out_subsys_put:
1439 if (ret)
1440 module_put(subsys_owner);
1441
1442 out_put:
1443 /*
1444 * link_obj()/link_group() took a reference from child->parent,
1445 * so the parent is safely pinned. We can drop our working
1446 * reference.
1447 */
1448 config_item_put(parent_item);
1449 put_fragment(frag);
1450
1451 out:
1452 return ret;
1453 }
1454
1455 static int configfs_rmdir(struct inode *dir, struct dentry *dentry)
1456 {
1457 struct config_item *parent_item;
1458 struct config_item *item;
1459 struct configfs_subsystem *subsys;
1460 struct configfs_dirent *sd;
1461 struct configfs_fragment *frag;
1462 struct module *subsys_owner = NULL, *dead_item_owner = NULL;
1463 int ret;
1464
1465 sd = dentry->d_fsdata;
1466 if (sd->s_type & CONFIGFS_USET_DEFAULT)
1467 return -EPERM;
1468
1469 /* Get a working ref until we have the child */
1470 parent_item = configfs_get_config_item(dentry->d_parent);
1471 subsys = to_config_group(parent_item)->cg_subsys;
1472 BUG_ON(!subsys);
1473
1474 if (!parent_item->ci_type) {
1475 config_item_put(parent_item);
1476 return -EINVAL;
1477 }
1478
1479 /* configfs_mkdir() shouldn't have allowed this */
1480 BUG_ON(!subsys->su_group.cg_item.ci_type);
1481 subsys_owner = subsys->su_group.cg_item.ci_type->ct_owner;
1482
1483 /*
1484 * Ensure that no racing symlink() will make detach_prep() fail while
1485 * the new link is temporarily attached
1486 */
1487 do {
1488 struct dentry *wait;
1489
1490 mutex_lock(&configfs_symlink_mutex);
1491 spin_lock(&configfs_dirent_lock);
1492 /*
1493 * Here's where we check for dependents. We're protected by
1494 * configfs_dirent_lock.
1495 * If no dependent, atomically tag the item as dropping.
1496 */
1497 ret = sd->s_dependent_count ? -EBUSY : 0;
1498 if (!ret) {
1499 ret = configfs_detach_prep(dentry, &wait);
1500 if (ret)
1501 configfs_detach_rollback(dentry);
1502 }
1503 spin_unlock(&configfs_dirent_lock);
1504 mutex_unlock(&configfs_symlink_mutex);
1505
1506 if (ret) {
1507 if (ret != -EAGAIN) {
1508 config_item_put(parent_item);
1509 return ret;
1510 }
1511
1512 /* Wait until the racing operation terminates */
1513 inode_lock(d_inode(wait));
1514 inode_unlock(d_inode(wait));
1515 dput(wait);
1516 }
1517 } while (ret == -EAGAIN);
1518
1519 frag = sd->s_frag;
1520 if (down_write_killable(&frag->frag_sem)) {
1521 spin_lock(&configfs_dirent_lock);
1522 configfs_detach_rollback(dentry);
1523 spin_unlock(&configfs_dirent_lock);
1524 config_item_put(parent_item);
1525 return -EINTR;
1526 }
1527 frag->frag_dead = true;
1528 up_write(&frag->frag_sem);
1529
1530 /* Get a working ref for the duration of this function */
1531 item = configfs_get_config_item(dentry);
1532
1533 /* Drop reference from above, item already holds one. */
1534 config_item_put(parent_item);
1535
1536 if (item->ci_type)
1537 dead_item_owner = item->ci_type->ct_owner;
1538
1539 if (sd->s_type & CONFIGFS_USET_DIR) {
1540 configfs_detach_group(item);
1541
1542 mutex_lock(&subsys->su_mutex);
1543 client_disconnect_notify(parent_item, item);
1544 unlink_group(to_config_group(item));
1545 } else {
1546 configfs_detach_item(item);
1547
1548 mutex_lock(&subsys->su_mutex);
1549 client_disconnect_notify(parent_item, item);
1550 unlink_obj(item);
1551 }
1552
1553 client_drop_item(parent_item, item);
1554 mutex_unlock(&subsys->su_mutex);
1555
1556 /* Drop our reference from above */
1557 config_item_put(item);
1558
1559 module_put(dead_item_owner);
1560 module_put(subsys_owner);
1561
1562 return 0;
1563 }
1564
1565 const struct inode_operations configfs_dir_inode_operations = {
1566 .mkdir = configfs_mkdir,
1567 .rmdir = configfs_rmdir,
1568 .symlink = configfs_symlink,
1569 .unlink = configfs_unlink,
1570 .lookup = configfs_lookup,
1571 .setattr = configfs_setattr,
1572 };
1573
1574 const struct inode_operations configfs_root_inode_operations = {
1575 .lookup = configfs_lookup,
1576 .setattr = configfs_setattr,
1577 };
1578
1579 static int configfs_dir_open(struct inode *inode, struct file *file)
1580 {
1581 struct dentry * dentry = file->f_path.dentry;
1582 struct configfs_dirent * parent_sd = dentry->d_fsdata;
1583 int err;
1584
1585 inode_lock(d_inode(dentry));
1586 /*
1587 * Fake invisibility if dir belongs to a group/default groups hierarchy
1588 * being attached
1589 */
1590 err = -ENOENT;
1591 if (configfs_dirent_is_ready(parent_sd)) {
1592 file->private_data = configfs_new_dirent(parent_sd, NULL, 0, NULL);
1593 if (IS_ERR(file->private_data))
1594 err = PTR_ERR(file->private_data);
1595 else
1596 err = 0;
1597 }
1598 inode_unlock(d_inode(dentry));
1599
1600 return err;
1601 }
1602
1603 static int configfs_dir_close(struct inode *inode, struct file *file)
1604 {
1605 struct dentry * dentry = file->f_path.dentry;
1606 struct configfs_dirent * cursor = file->private_data;
1607
1608 inode_lock(d_inode(dentry));
1609 spin_lock(&configfs_dirent_lock);
1610 list_del_init(&cursor->s_sibling);
1611 spin_unlock(&configfs_dirent_lock);
1612 inode_unlock(d_inode(dentry));
1613
1614 release_configfs_dirent(cursor);
1615
1616 return 0;
1617 }
1618
1619 /* Relationship between s_mode and the DT_xxx types */
1620 static inline unsigned char dt_type(struct configfs_dirent *sd)
1621 {
1622 return (sd->s_mode >> 12) & 15;
1623 }
1624
1625 static int configfs_readdir(struct file *file, struct dir_context *ctx)
1626 {
1627 struct dentry *dentry = file->f_path.dentry;
1628 struct super_block *sb = dentry->d_sb;
1629 struct configfs_dirent * parent_sd = dentry->d_fsdata;
1630 struct configfs_dirent *cursor = file->private_data;
1631 struct list_head *p, *q = &cursor->s_sibling;
1632 ino_t ino = 0;
1633
1634 if (!dir_emit_dots(file, ctx))
1635 return 0;
1636 spin_lock(&configfs_dirent_lock);
1637 if (ctx->pos == 2)
1638 list_move(q, &parent_sd->s_children);
1639 for (p = q->next; p != &parent_sd->s_children; p = p->next) {
1640 struct configfs_dirent *next;
1641 const char *name;
1642 int len;
1643 struct inode *inode = NULL;
1644
1645 next = list_entry(p, struct configfs_dirent, s_sibling);
1646 if (!next->s_element)
1647 continue;
1648
1649 /*
1650 * We'll have a dentry and an inode for
1651 * PINNED items and for open attribute
1652 * files. We lock here to prevent a race
1653 * with configfs_d_iput() clearing
1654 * s_dentry before calling iput().
1655 *
1656 * Why do we go to the trouble? If
1657 * someone has an attribute file open,
1658 * the inode number should match until
1659 * they close it. Beyond that, we don't
1660 * care.
1661 */
1662 dentry = next->s_dentry;
1663 if (dentry)
1664 inode = d_inode(dentry);
1665 if (inode)
1666 ino = inode->i_ino;
1667 spin_unlock(&configfs_dirent_lock);
1668 if (!inode)
1669 ino = iunique(sb, 2);
1670
1671 name = configfs_get_name(next);
1672 len = strlen(name);
1673
1674 if (!dir_emit(ctx, name, len, ino, dt_type(next)))
1675 return 0;
1676
1677 spin_lock(&configfs_dirent_lock);
1678 list_move(q, p);
1679 p = q;
1680 ctx->pos++;
1681 }
1682 spin_unlock(&configfs_dirent_lock);
1683 return 0;
1684 }
1685
1686 static loff_t configfs_dir_lseek(struct file *file, loff_t offset, int whence)
1687 {
1688 struct dentry * dentry = file->f_path.dentry;
1689
1690 switch (whence) {
1691 case 1:
1692 offset += file->f_pos;
1693 fallthrough;
1694 case 0:
1695 if (offset >= 0)
1696 break;
1697 fallthrough;
1698 default:
1699 return -EINVAL;
1700 }
1701 if (offset != file->f_pos) {
1702 file->f_pos = offset;
1703 if (file->f_pos >= 2) {
1704 struct configfs_dirent *sd = dentry->d_fsdata;
1705 struct configfs_dirent *cursor = file->private_data;
1706 struct list_head *p;
1707 loff_t n = file->f_pos - 2;
1708
1709 spin_lock(&configfs_dirent_lock);
1710 list_del(&cursor->s_sibling);
1711 p = sd->s_children.next;
1712 while (n && p != &sd->s_children) {
1713 struct configfs_dirent *next;
1714 next = list_entry(p, struct configfs_dirent,
1715 s_sibling);
1716 if (next->s_element)
1717 n--;
1718 p = p->next;
1719 }
1720 list_add_tail(&cursor->s_sibling, p);
1721 spin_unlock(&configfs_dirent_lock);
1722 }
1723 }
1724 return offset;
1725 }
1726
1727 const struct file_operations configfs_dir_operations = {
1728 .open = configfs_dir_open,
1729 .release = configfs_dir_close,
1730 .llseek = configfs_dir_lseek,
1731 .read = generic_read_dir,
1732 .iterate_shared = configfs_readdir,
1733 };
1734
1735 /**
1736 * configfs_register_group - creates a parent-child relation between two groups
1737 * @parent_group: parent group
1738 * @group: child group
1739 *
1740 * link groups, creates dentry for the child and attaches it to the
1741 * parent dentry.
1742 *
1743 * Return: 0 on success, negative errno code on error
1744 */
1745 int configfs_register_group(struct config_group *parent_group,
1746 struct config_group *group)
1747 {
1748 struct configfs_subsystem *subsys = parent_group->cg_subsys;
1749 struct dentry *parent;
1750 struct configfs_fragment *frag;
1751 int ret;
1752
1753 frag = new_fragment();
1754 if (!frag)
1755 return -ENOMEM;
1756
1757 mutex_lock(&subsys->su_mutex);
1758 link_group(parent_group, group);
1759 mutex_unlock(&subsys->su_mutex);
1760
1761 parent = parent_group->cg_item.ci_dentry;
1762
1763 inode_lock_nested(d_inode(parent), I_MUTEX_PARENT);
1764 ret = create_default_group(parent_group, group, frag);
1765 if (ret)
1766 goto err_out;
1767
1768 spin_lock(&configfs_dirent_lock);
1769 configfs_dir_set_ready(group->cg_item.ci_dentry->d_fsdata);
1770 spin_unlock(&configfs_dirent_lock);
1771 inode_unlock(d_inode(parent));
1772 put_fragment(frag);
1773 return 0;
1774 err_out:
1775 inode_unlock(d_inode(parent));
1776 mutex_lock(&subsys->su_mutex);
1777 unlink_group(group);
1778 mutex_unlock(&subsys->su_mutex);
1779 put_fragment(frag);
1780 return ret;
1781 }
1782 EXPORT_SYMBOL(configfs_register_group);
1783
1784 /**
1785 * configfs_unregister_group() - unregisters a child group from its parent
1786 * @group: parent group to be unregistered
1787 *
1788 * Undoes configfs_register_group()
1789 */
1790 void configfs_unregister_group(struct config_group *group)
1791 {
1792 struct configfs_subsystem *subsys = group->cg_subsys;
1793 struct dentry *dentry = group->cg_item.ci_dentry;
1794 struct dentry *parent = group->cg_item.ci_parent->ci_dentry;
1795 struct configfs_dirent *sd = dentry->d_fsdata;
1796 struct configfs_fragment *frag = sd->s_frag;
1797
1798 down_write(&frag->frag_sem);
1799 frag->frag_dead = true;
1800 up_write(&frag->frag_sem);
1801
1802 inode_lock_nested(d_inode(parent), I_MUTEX_PARENT);
1803 spin_lock(&configfs_dirent_lock);
1804 configfs_detach_prep(dentry, NULL);
1805 spin_unlock(&configfs_dirent_lock);
1806
1807 configfs_detach_group(&group->cg_item);
1808 d_inode(dentry)->i_flags |= S_DEAD;
1809 dont_mount(dentry);
1810 fsnotify_rmdir(d_inode(parent), dentry);
1811 d_delete(dentry);
1812 inode_unlock(d_inode(parent));
1813
1814 dput(dentry);
1815
1816 mutex_lock(&subsys->su_mutex);
1817 unlink_group(group);
1818 mutex_unlock(&subsys->su_mutex);
1819 }
1820 EXPORT_SYMBOL(configfs_unregister_group);
1821
1822 /**
1823 * configfs_register_default_group() - allocates and registers a child group
1824 * @parent_group: parent group
1825 * @name: child group name
1826 * @item_type: child item type description
1827 *
1828 * boilerplate to allocate and register a child group with its parent. We need
1829 * kzalloc'ed memory because child's default_group is initially empty.
1830 *
1831 * Return: allocated config group or ERR_PTR() on error
1832 */
1833 struct config_group *
1834 configfs_register_default_group(struct config_group *parent_group,
1835 const char *name,
1836 const struct config_item_type *item_type)
1837 {
1838 int ret;
1839 struct config_group *group;
1840
1841 group = kzalloc(sizeof(*group), GFP_KERNEL);
1842 if (!group)
1843 return ERR_PTR(-ENOMEM);
1844 config_group_init_type_name(group, name, item_type);
1845
1846 ret = configfs_register_group(parent_group, group);
1847 if (ret) {
1848 kfree(group);
1849 return ERR_PTR(ret);
1850 }
1851 return group;
1852 }
1853 EXPORT_SYMBOL(configfs_register_default_group);
1854
/**
 * configfs_unregister_default_group() - unregisters and frees a child group
 * @group: the group to act on
 *
 * Calls configfs_unregister_group() on @group and then kfree()s it, so the
 * caller must not touch @group afterwards.
 */
void configfs_unregister_default_group(struct config_group *group)
{
	configfs_unregister_group(group);

	/* The group's memory is released here. */
	kfree(group);
}
EXPORT_SYMBOL(configfs_unregister_default_group);
1865
1866 int configfs_register_subsystem(struct configfs_subsystem *subsys)
1867 {
1868 int err;
1869 struct config_group *group = &subsys->su_group;
1870 struct dentry *dentry;
1871 struct dentry *root;
1872 struct configfs_dirent *sd;
1873 struct configfs_fragment *frag;
1874
1875 frag = new_fragment();
1876 if (!frag)
1877 return -ENOMEM;
1878
1879 root = configfs_pin_fs();
1880 if (IS_ERR(root)) {
1881 put_fragment(frag);
1882 return PTR_ERR(root);
1883 }
1884
1885 if (!group->cg_item.ci_name)
1886 group->cg_item.ci_name = group->cg_item.ci_namebuf;
1887
1888 sd = root->d_fsdata;
1889 link_group(to_config_group(sd->s_element), group);
1890
1891 inode_lock_nested(d_inode(root), I_MUTEX_PARENT);
1892
1893 err = -ENOMEM;
1894 dentry = d_alloc_name(root, group->cg_item.ci_name);
1895 if (dentry) {
1896 d_add(dentry, NULL);
1897
1898 err = configfs_attach_group(sd->s_element, &group->cg_item,
1899 dentry, frag);
1900 if (err) {
1901 BUG_ON(d_inode(dentry));
1902 d_drop(dentry);
1903 dput(dentry);
1904 } else {
1905 spin_lock(&configfs_dirent_lock);
1906 configfs_dir_set_ready(dentry->d_fsdata);
1907 spin_unlock(&configfs_dirent_lock);
1908 }
1909 }
1910
1911 inode_unlock(d_inode(root));
1912
1913 if (err) {
1914 unlink_group(group);
1915 configfs_release_fs();
1916 }
1917 put_fragment(frag);
1918
1919 return err;
1920 }
1921
1922 void configfs_unregister_subsystem(struct configfs_subsystem *subsys)
1923 {
1924 struct config_group *group = &subsys->su_group;
1925 struct dentry *dentry = group->cg_item.ci_dentry;
1926 struct dentry *root = dentry->d_sb->s_root;
1927 struct configfs_dirent *sd = dentry->d_fsdata;
1928 struct configfs_fragment *frag = sd->s_frag;
1929
1930 if (dentry->d_parent != root) {
1931 pr_err("Tried to unregister non-subsystem!\n");
1932 return;
1933 }
1934
1935 down_write(&frag->frag_sem);
1936 frag->frag_dead = true;
1937 up_write(&frag->frag_sem);
1938
1939 inode_lock_nested(d_inode(root),
1940 I_MUTEX_PARENT);
1941 inode_lock_nested(d_inode(dentry), I_MUTEX_CHILD);
1942 mutex_lock(&configfs_symlink_mutex);
1943 spin_lock(&configfs_dirent_lock);
1944 if (configfs_detach_prep(dentry, NULL)) {
1945 pr_err("Tried to unregister non-empty subsystem!\n");
1946 }
1947 spin_unlock(&configfs_dirent_lock);
1948 mutex_unlock(&configfs_symlink_mutex);
1949 configfs_detach_group(&group->cg_item);
1950 d_inode(dentry)->i_flags |= S_DEAD;
1951 dont_mount(dentry);
1952 fsnotify_rmdir(d_inode(root), dentry);
1953 inode_unlock(d_inode(dentry));
1954
1955 d_delete(dentry);
1956
1957 inode_unlock(d_inode(root));
1958
1959 dput(dentry);
1960
1961 unlink_group(group);
1962 configfs_release_fs();
1963 }
1964
1965 EXPORT_SYMBOL(configfs_register_subsystem);
1966 EXPORT_SYMBOL(configfs_unregister_subsystem);