xref: /linux/fs/configfs/dir.c (revision a4eb44a6435d6d8f9e642407a4a06f65eb90ca04)
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  * dir.c - Operations for configfs directories.
4  *
5  * Based on sysfs:
6  * 	sysfs is Copyright (C) 2001, 2002, 2003 Patrick Mochel
7  *
8  * configfs Copyright (C) 2005 Oracle.  All rights reserved.
9  */
10 
11 #undef DEBUG
12 
13 #include <linux/fs.h>
14 #include <linux/fsnotify.h>
15 #include <linux/mount.h>
16 #include <linux/module.h>
17 #include <linux/slab.h>
18 #include <linux/err.h>
19 
20 #include <linux/configfs.h>
21 #include "configfs_internal.h"
22 
23 /*
24  * Protects mutations of configfs_dirent linkage together with proper i_mutex
25  * Also protects mutations of symlinks linkage to target configfs_dirent
26  * Mutators of configfs_dirent linkage must *both* have the proper inode locked
27  * and configfs_dirent_lock locked, in that order.
28  * This allows one to safely traverse configfs_dirent trees and symlinks without
29  * having to lock inodes.
30  *
31  * Protects setting of CONFIGFS_USET_DROPPING: checking the flag
32  * unlocked is not reliable unless in detach_groups() called from
33  * rmdir()/unregister() and from configfs_attach_group()
34  */
35 DEFINE_SPINLOCK(configfs_dirent_lock);
36 
37 /*
38  * All of link_obj/unlink_obj/link_group/unlink_group require that
39  * subsys->su_mutex is held.
40  * But parent configfs_subsystem is NULL when config_item is root.
41  * Use this mutex when config_item is root.
42  */
43 static DEFINE_MUTEX(configfs_subsystem_mutex);
44 
45 static void configfs_d_iput(struct dentry * dentry,
46 			    struct inode * inode)
47 {
48 	struct configfs_dirent *sd = dentry->d_fsdata;
49 
50 	if (sd) {
51 		/* Coordinate with configfs_readdir */
52 		spin_lock(&configfs_dirent_lock);
53 		/*
54 		 * Set sd->s_dentry to null only when this dentry is the one
55 		 * that is going to be killed.  Otherwise configfs_d_iput may
56 		 * run just after configfs_lookup and set sd->s_dentry to
57 		 * NULL even it's still in use.
58 		 */
59 		if (sd->s_dentry == dentry)
60 			sd->s_dentry = NULL;
61 
62 		spin_unlock(&configfs_dirent_lock);
63 		configfs_put(sd);
64 	}
65 	iput(inode);
66 }
67 
68 const struct dentry_operations configfs_dentry_ops = {
69 	.d_iput		= configfs_d_iput,
70 	.d_delete	= always_delete_dentry,
71 };
72 
73 #ifdef CONFIG_LOCKDEP
74 
75 /*
76  * Helpers to make lockdep happy with our recursive locking of default groups'
77  * inodes (see configfs_attach_group() and configfs_detach_group()).
78  * We put default groups i_mutexes in separate classes according to their depth
79  * from the youngest non-default group ancestor.
80  *
81  * For a non-default group A having default groups A/B, A/C, and A/C/D, default
82  * groups A/B and A/C will have their inode's mutex in class
83  * default_group_class[0], and default group A/C/D will be in
84  * default_group_class[1].
85  *
86  * The lock classes are declared and assigned in inode.c, according to the
87  * s_depth value.
88  * The s_depth value is initialized to -1, adjusted to >= 0 when attaching
89  * default groups, and reset to -1 when all default groups are attached. During
90  * attachment, if configfs_create() sees s_depth > 0, the lock class of the new
91  * inode's mutex is set to default_group_class[s_depth - 1].
92  */
93 
94 static void configfs_init_dirent_depth(struct configfs_dirent *sd)
95 {
96 	sd->s_depth = -1;
97 }
98 
99 static void configfs_set_dir_dirent_depth(struct configfs_dirent *parent_sd,
100 					  struct configfs_dirent *sd)
101 {
102 	int parent_depth = parent_sd->s_depth;
103 
104 	if (parent_depth >= 0)
105 		sd->s_depth = parent_depth + 1;
106 }
107 
108 static void
109 configfs_adjust_dir_dirent_depth_before_populate(struct configfs_dirent *sd)
110 {
111 	/*
112 	 * item's i_mutex class is already setup, so s_depth is now only
113 	 * used to set new sub-directories s_depth, which is always done
114 	 * with item's i_mutex locked.
115 	 */
116 	/*
117 	 *  sd->s_depth == -1 iff we are a non default group.
118 	 *  else (we are a default group) sd->s_depth > 0 (see
119 	 *  create_dir()).
120 	 */
121 	if (sd->s_depth == -1)
122 		/*
123 		 * We are a non default group and we are going to create
124 		 * default groups.
125 		 */
126 		sd->s_depth = 0;
127 }
128 
129 static void
130 configfs_adjust_dir_dirent_depth_after_populate(struct configfs_dirent *sd)
131 {
132 	/* We will not create default groups anymore. */
133 	sd->s_depth = -1;
134 }
135 
136 #else /* CONFIG_LOCKDEP */
137 
138 static void configfs_init_dirent_depth(struct configfs_dirent *sd)
139 {
140 }
141 
142 static void configfs_set_dir_dirent_depth(struct configfs_dirent *parent_sd,
143 					  struct configfs_dirent *sd)
144 {
145 }
146 
147 static void
148 configfs_adjust_dir_dirent_depth_before_populate(struct configfs_dirent *sd)
149 {
150 }
151 
152 static void
153 configfs_adjust_dir_dirent_depth_after_populate(struct configfs_dirent *sd)
154 {
155 }
156 
157 #endif /* CONFIG_LOCKDEP */
158 
159 static struct configfs_fragment *new_fragment(void)
160 {
161 	struct configfs_fragment *p;
162 
163 	p = kmalloc(sizeof(struct configfs_fragment), GFP_KERNEL);
164 	if (p) {
165 		atomic_set(&p->frag_count, 1);
166 		init_rwsem(&p->frag_sem);
167 		p->frag_dead = false;
168 	}
169 	return p;
170 }
171 
172 void put_fragment(struct configfs_fragment *frag)
173 {
174 	if (frag && atomic_dec_and_test(&frag->frag_count))
175 		kfree(frag);
176 }
177 
178 struct configfs_fragment *get_fragment(struct configfs_fragment *frag)
179 {
180 	if (likely(frag))
181 		atomic_inc(&frag->frag_count);
182 	return frag;
183 }
184 
185 /*
186  * Allocates a new configfs_dirent and links it to the parent configfs_dirent
187  */
188 static struct configfs_dirent *configfs_new_dirent(struct configfs_dirent *parent_sd,
189 						   void *element, int type,
190 						   struct configfs_fragment *frag)
191 {
192 	struct configfs_dirent * sd;
193 
194 	sd = kmem_cache_zalloc(configfs_dir_cachep, GFP_KERNEL);
195 	if (!sd)
196 		return ERR_PTR(-ENOMEM);
197 
198 	atomic_set(&sd->s_count, 1);
199 	INIT_LIST_HEAD(&sd->s_children);
200 	sd->s_element = element;
201 	sd->s_type = type;
202 	configfs_init_dirent_depth(sd);
203 	spin_lock(&configfs_dirent_lock);
204 	if (parent_sd->s_type & CONFIGFS_USET_DROPPING) {
205 		spin_unlock(&configfs_dirent_lock);
206 		kmem_cache_free(configfs_dir_cachep, sd);
207 		return ERR_PTR(-ENOENT);
208 	}
209 	sd->s_frag = get_fragment(frag);
210 	list_add(&sd->s_sibling, &parent_sd->s_children);
211 	spin_unlock(&configfs_dirent_lock);
212 
213 	return sd;
214 }
215 
216 /*
217  *
218  * Return -EEXIST if there is already a configfs element with the same
219  * name for the same parent.
220  *
221  * called with parent inode's i_mutex held
222  */
223 static int configfs_dirent_exists(struct configfs_dirent *parent_sd,
224 				  const unsigned char *new)
225 {
226 	struct configfs_dirent * sd;
227 
228 	list_for_each_entry(sd, &parent_sd->s_children, s_sibling) {
229 		if (sd->s_element) {
230 			const unsigned char *existing = configfs_get_name(sd);
231 			if (strcmp(existing, new))
232 				continue;
233 			else
234 				return -EEXIST;
235 		}
236 	}
237 
238 	return 0;
239 }
240 
241 
242 int configfs_make_dirent(struct configfs_dirent * parent_sd,
243 			 struct dentry * dentry, void * element,
244 			 umode_t mode, int type, struct configfs_fragment *frag)
245 {
246 	struct configfs_dirent * sd;
247 
248 	sd = configfs_new_dirent(parent_sd, element, type, frag);
249 	if (IS_ERR(sd))
250 		return PTR_ERR(sd);
251 
252 	sd->s_mode = mode;
253 	sd->s_dentry = dentry;
254 	if (dentry)
255 		dentry->d_fsdata = configfs_get(sd);
256 
257 	return 0;
258 }
259 
260 static void configfs_remove_dirent(struct dentry *dentry)
261 {
262 	struct configfs_dirent *sd = dentry->d_fsdata;
263 
264 	if (!sd)
265 		return;
266 	spin_lock(&configfs_dirent_lock);
267 	list_del_init(&sd->s_sibling);
268 	spin_unlock(&configfs_dirent_lock);
269 	configfs_put(sd);
270 }
271 
272 /**
273  *	configfs_create_dir - create a directory for an config_item.
274  *	@item:		config_itemwe're creating directory for.
275  *	@dentry:	config_item's dentry.
276  *	@frag:		config_item's fragment.
277  *
278  *	Note: user-created entries won't be allowed under this new directory
279  *	until it is validated by configfs_dir_set_ready()
280  */
281 
282 static int configfs_create_dir(struct config_item *item, struct dentry *dentry,
283 				struct configfs_fragment *frag)
284 {
285 	int error;
286 	umode_t mode = S_IFDIR| S_IRWXU | S_IRUGO | S_IXUGO;
287 	struct dentry *p = dentry->d_parent;
288 	struct inode *inode;
289 
290 	BUG_ON(!item);
291 
292 	error = configfs_dirent_exists(p->d_fsdata, dentry->d_name.name);
293 	if (unlikely(error))
294 		return error;
295 
296 	error = configfs_make_dirent(p->d_fsdata, dentry, item, mode,
297 				     CONFIGFS_DIR | CONFIGFS_USET_CREATING,
298 				     frag);
299 	if (unlikely(error))
300 		return error;
301 
302 	configfs_set_dir_dirent_depth(p->d_fsdata, dentry->d_fsdata);
303 	inode = configfs_create(dentry, mode);
304 	if (IS_ERR(inode))
305 		goto out_remove;
306 
307 	inode->i_op = &configfs_dir_inode_operations;
308 	inode->i_fop = &configfs_dir_operations;
309 	/* directory inodes start off with i_nlink == 2 (for "." entry) */
310 	inc_nlink(inode);
311 	d_instantiate(dentry, inode);
312 	/* already hashed */
313 	dget(dentry);  /* pin directory dentries in core */
314 	inc_nlink(d_inode(p));
315 	item->ci_dentry = dentry;
316 	return 0;
317 
318 out_remove:
319 	configfs_remove_dirent(dentry);
320 	return PTR_ERR(inode);
321 }
322 
323 /*
324  * Allow userspace to create new entries under a new directory created with
325  * configfs_create_dir(), and under all of its chidlren directories recursively.
326  * @sd		configfs_dirent of the new directory to validate
327  *
328  * Caller must hold configfs_dirent_lock.
329  */
330 static void configfs_dir_set_ready(struct configfs_dirent *sd)
331 {
332 	struct configfs_dirent *child_sd;
333 
334 	sd->s_type &= ~CONFIGFS_USET_CREATING;
335 	list_for_each_entry(child_sd, &sd->s_children, s_sibling)
336 		if (child_sd->s_type & CONFIGFS_USET_CREATING)
337 			configfs_dir_set_ready(child_sd);
338 }
339 
340 /*
341  * Check that a directory does not belong to a directory hierarchy being
342  * attached and not validated yet.
343  * @sd		configfs_dirent of the directory to check
344  *
345  * @return	non-zero iff the directory was validated
346  *
347  * Note: takes configfs_dirent_lock, so the result may change from false to true
348  * in two consecutive calls, but never from true to false.
349  */
350 int configfs_dirent_is_ready(struct configfs_dirent *sd)
351 {
352 	int ret;
353 
354 	spin_lock(&configfs_dirent_lock);
355 	ret = !(sd->s_type & CONFIGFS_USET_CREATING);
356 	spin_unlock(&configfs_dirent_lock);
357 
358 	return ret;
359 }
360 
361 int configfs_create_link(struct configfs_dirent *target, struct dentry *parent,
362 		struct dentry *dentry, char *body)
363 {
364 	int err = 0;
365 	umode_t mode = S_IFLNK | S_IRWXUGO;
366 	struct configfs_dirent *p = parent->d_fsdata;
367 	struct inode *inode;
368 
369 	err = configfs_make_dirent(p, dentry, target, mode, CONFIGFS_ITEM_LINK,
370 			p->s_frag);
371 	if (err)
372 		return err;
373 
374 	inode = configfs_create(dentry, mode);
375 	if (IS_ERR(inode))
376 		goto out_remove;
377 
378 	inode->i_link = body;
379 	inode->i_op = &configfs_symlink_inode_operations;
380 	d_instantiate(dentry, inode);
381 	dget(dentry);  /* pin link dentries in core */
382 	return 0;
383 
384 out_remove:
385 	configfs_remove_dirent(dentry);
386 	return PTR_ERR(inode);
387 }
388 
389 static void remove_dir(struct dentry * d)
390 {
391 	struct dentry * parent = dget(d->d_parent);
392 
393 	configfs_remove_dirent(d);
394 
395 	if (d_really_is_positive(d))
396 		simple_rmdir(d_inode(parent),d);
397 
398 	pr_debug(" o %pd removing done (%d)\n", d, d_count(d));
399 
400 	dput(parent);
401 }
402 
403 /**
404  * configfs_remove_dir - remove an config_item's directory.
405  * @item:	config_item we're removing.
406  *
407  * The only thing special about this is that we remove any files in
408  * the directory before we remove the directory, and we've inlined
409  * what used to be configfs_rmdir() below, instead of calling separately.
410  *
411  * Caller holds the mutex of the item's inode
412  */
413 
414 static void configfs_remove_dir(struct config_item * item)
415 {
416 	struct dentry * dentry = dget(item->ci_dentry);
417 
418 	if (!dentry)
419 		return;
420 
421 	remove_dir(dentry);
422 	/**
423 	 * Drop reference from dget() on entrance.
424 	 */
425 	dput(dentry);
426 }
427 
428 static struct dentry * configfs_lookup(struct inode *dir,
429 				       struct dentry *dentry,
430 				       unsigned int flags)
431 {
432 	struct configfs_dirent * parent_sd = dentry->d_parent->d_fsdata;
433 	struct configfs_dirent * sd;
434 	struct inode *inode = NULL;
435 
436 	if (dentry->d_name.len > NAME_MAX)
437 		return ERR_PTR(-ENAMETOOLONG);
438 
439 	/*
440 	 * Fake invisibility if dir belongs to a group/default groups hierarchy
441 	 * being attached
442 	 *
443 	 * This forbids userspace to read/write attributes of items which may
444 	 * not complete their initialization, since the dentries of the
445 	 * attributes won't be instantiated.
446 	 */
447 	if (!configfs_dirent_is_ready(parent_sd))
448 		return ERR_PTR(-ENOENT);
449 
450 	spin_lock(&configfs_dirent_lock);
451 	list_for_each_entry(sd, &parent_sd->s_children, s_sibling) {
452 		if ((sd->s_type & CONFIGFS_NOT_PINNED) &&
453 		    !strcmp(configfs_get_name(sd), dentry->d_name.name)) {
454 			struct configfs_attribute *attr = sd->s_element;
455 			umode_t mode = (attr->ca_mode & S_IALLUGO) | S_IFREG;
456 
457 			dentry->d_fsdata = configfs_get(sd);
458 			sd->s_dentry = dentry;
459 			spin_unlock(&configfs_dirent_lock);
460 
461 			inode = configfs_create(dentry, mode);
462 			if (IS_ERR(inode)) {
463 				configfs_put(sd);
464 				return ERR_CAST(inode);
465 			}
466 			if (sd->s_type & CONFIGFS_ITEM_BIN_ATTR) {
467 				inode->i_size = 0;
468 				inode->i_fop = &configfs_bin_file_operations;
469 			} else {
470 				inode->i_size = PAGE_SIZE;
471 				inode->i_fop = &configfs_file_operations;
472 			}
473 			goto done;
474 		}
475 	}
476 	spin_unlock(&configfs_dirent_lock);
477 done:
478 	d_add(dentry, inode);
479 	return NULL;
480 }
481 
482 /*
483  * Only subdirectories count here.  Files (CONFIGFS_NOT_PINNED) are
484  * attributes and are removed by rmdir().  We recurse, setting
485  * CONFIGFS_USET_DROPPING on all children that are candidates for
486  * default detach.
487  * If there is an error, the caller will reset the flags via
488  * configfs_detach_rollback().
489  */
490 static int configfs_detach_prep(struct dentry *dentry, struct dentry **wait)
491 {
492 	struct configfs_dirent *parent_sd = dentry->d_fsdata;
493 	struct configfs_dirent *sd;
494 	int ret;
495 
496 	/* Mark that we're trying to drop the group */
497 	parent_sd->s_type |= CONFIGFS_USET_DROPPING;
498 
499 	ret = -EBUSY;
500 	if (parent_sd->s_links)
501 		goto out;
502 
503 	ret = 0;
504 	list_for_each_entry(sd, &parent_sd->s_children, s_sibling) {
505 		if (!sd->s_element ||
506 		    (sd->s_type & CONFIGFS_NOT_PINNED))
507 			continue;
508 		if (sd->s_type & CONFIGFS_USET_DEFAULT) {
509 			/* Abort if racing with mkdir() */
510 			if (sd->s_type & CONFIGFS_USET_IN_MKDIR) {
511 				if (wait)
512 					*wait= dget(sd->s_dentry);
513 				return -EAGAIN;
514 			}
515 
516 			/*
517 			 * Yup, recursive.  If there's a problem, blame
518 			 * deep nesting of default_groups
519 			 */
520 			ret = configfs_detach_prep(sd->s_dentry, wait);
521 			if (!ret)
522 				continue;
523 		} else
524 			ret = -ENOTEMPTY;
525 
526 		break;
527 	}
528 
529 out:
530 	return ret;
531 }
532 
533 /*
534  * Walk the tree, resetting CONFIGFS_USET_DROPPING wherever it was
535  * set.
536  */
537 static void configfs_detach_rollback(struct dentry *dentry)
538 {
539 	struct configfs_dirent *parent_sd = dentry->d_fsdata;
540 	struct configfs_dirent *sd;
541 
542 	parent_sd->s_type &= ~CONFIGFS_USET_DROPPING;
543 
544 	list_for_each_entry(sd, &parent_sd->s_children, s_sibling)
545 		if (sd->s_type & CONFIGFS_USET_DEFAULT)
546 			configfs_detach_rollback(sd->s_dentry);
547 }
548 
549 static void detach_attrs(struct config_item * item)
550 {
551 	struct dentry * dentry = dget(item->ci_dentry);
552 	struct configfs_dirent * parent_sd;
553 	struct configfs_dirent * sd, * tmp;
554 
555 	if (!dentry)
556 		return;
557 
558 	pr_debug("configfs %s: dropping attrs for  dir\n",
559 		 dentry->d_name.name);
560 
561 	parent_sd = dentry->d_fsdata;
562 	list_for_each_entry_safe(sd, tmp, &parent_sd->s_children, s_sibling) {
563 		if (!sd->s_element || !(sd->s_type & CONFIGFS_NOT_PINNED))
564 			continue;
565 		spin_lock(&configfs_dirent_lock);
566 		list_del_init(&sd->s_sibling);
567 		spin_unlock(&configfs_dirent_lock);
568 		configfs_drop_dentry(sd, dentry);
569 		configfs_put(sd);
570 	}
571 
572 	/**
573 	 * Drop reference from dget() on entrance.
574 	 */
575 	dput(dentry);
576 }
577 
578 static int populate_attrs(struct config_item *item)
579 {
580 	const struct config_item_type *t = item->ci_type;
581 	struct configfs_attribute *attr;
582 	struct configfs_bin_attribute *bin_attr;
583 	int error = 0;
584 	int i;
585 
586 	if (!t)
587 		return -EINVAL;
588 	if (t->ct_attrs) {
589 		for (i = 0; (attr = t->ct_attrs[i]) != NULL; i++) {
590 			if ((error = configfs_create_file(item, attr)))
591 				break;
592 		}
593 	}
594 	if (t->ct_bin_attrs) {
595 		for (i = 0; (bin_attr = t->ct_bin_attrs[i]) != NULL; i++) {
596 			error = configfs_create_bin_file(item, bin_attr);
597 			if (error)
598 				break;
599 		}
600 	}
601 
602 	if (error)
603 		detach_attrs(item);
604 
605 	return error;
606 }
607 
608 static int configfs_attach_group(struct config_item *parent_item,
609 				 struct config_item *item,
610 				 struct dentry *dentry,
611 				 struct configfs_fragment *frag);
612 static void configfs_detach_group(struct config_item *item);
613 
614 static void detach_groups(struct config_group *group)
615 {
616 	struct dentry * dentry = dget(group->cg_item.ci_dentry);
617 	struct dentry *child;
618 	struct configfs_dirent *parent_sd;
619 	struct configfs_dirent *sd, *tmp;
620 
621 	if (!dentry)
622 		return;
623 
624 	parent_sd = dentry->d_fsdata;
625 	list_for_each_entry_safe(sd, tmp, &parent_sd->s_children, s_sibling) {
626 		if (!sd->s_element ||
627 		    !(sd->s_type & CONFIGFS_USET_DEFAULT))
628 			continue;
629 
630 		child = sd->s_dentry;
631 
632 		inode_lock(d_inode(child));
633 
634 		configfs_detach_group(sd->s_element);
635 		d_inode(child)->i_flags |= S_DEAD;
636 		dont_mount(child);
637 
638 		inode_unlock(d_inode(child));
639 
640 		d_delete(child);
641 		dput(child);
642 	}
643 
644 	/**
645 	 * Drop reference from dget() on entrance.
646 	 */
647 	dput(dentry);
648 }
649 
650 /*
651  * This fakes mkdir(2) on a default_groups[] entry.  It
652  * creates a dentry, attachs it, and then does fixup
653  * on the sd->s_type.
654  *
655  * We could, perhaps, tweak our parent's ->mkdir for a minute and
656  * try using vfs_mkdir.  Just a thought.
657  */
658 static int create_default_group(struct config_group *parent_group,
659 				struct config_group *group,
660 				struct configfs_fragment *frag)
661 {
662 	int ret;
663 	struct configfs_dirent *sd;
664 	/* We trust the caller holds a reference to parent */
665 	struct dentry *child, *parent = parent_group->cg_item.ci_dentry;
666 
667 	if (!group->cg_item.ci_name)
668 		group->cg_item.ci_name = group->cg_item.ci_namebuf;
669 
670 	ret = -ENOMEM;
671 	child = d_alloc_name(parent, group->cg_item.ci_name);
672 	if (child) {
673 		d_add(child, NULL);
674 
675 		ret = configfs_attach_group(&parent_group->cg_item,
676 					    &group->cg_item, child, frag);
677 		if (!ret) {
678 			sd = child->d_fsdata;
679 			sd->s_type |= CONFIGFS_USET_DEFAULT;
680 		} else {
681 			BUG_ON(d_inode(child));
682 			d_drop(child);
683 			dput(child);
684 		}
685 	}
686 
687 	return ret;
688 }
689 
690 static int populate_groups(struct config_group *group,
691 			   struct configfs_fragment *frag)
692 {
693 	struct config_group *new_group;
694 	int ret = 0;
695 
696 	list_for_each_entry(new_group, &group->default_groups, group_entry) {
697 		ret = create_default_group(group, new_group, frag);
698 		if (ret) {
699 			detach_groups(group);
700 			break;
701 		}
702 	}
703 
704 	return ret;
705 }
706 
707 void configfs_remove_default_groups(struct config_group *group)
708 {
709 	struct config_group *g, *n;
710 
711 	list_for_each_entry_safe(g, n, &group->default_groups, group_entry) {
712 		list_del(&g->group_entry);
713 		config_item_put(&g->cg_item);
714 	}
715 }
716 EXPORT_SYMBOL(configfs_remove_default_groups);
717 
718 /*
719  * All of link_obj/unlink_obj/link_group/unlink_group require that
720  * subsys->su_mutex is held.
721  */
722 
723 static void unlink_obj(struct config_item *item)
724 {
725 	struct config_group *group;
726 
727 	group = item->ci_group;
728 	if (group) {
729 		list_del_init(&item->ci_entry);
730 
731 		item->ci_group = NULL;
732 		item->ci_parent = NULL;
733 
734 		/* Drop the reference for ci_entry */
735 		config_item_put(item);
736 
737 		/* Drop the reference for ci_parent */
738 		config_group_put(group);
739 	}
740 }
741 
742 static void link_obj(struct config_item *parent_item, struct config_item *item)
743 {
744 	/*
745 	 * Parent seems redundant with group, but it makes certain
746 	 * traversals much nicer.
747 	 */
748 	item->ci_parent = parent_item;
749 
750 	/*
751 	 * We hold a reference on the parent for the child's ci_parent
752 	 * link.
753 	 */
754 	item->ci_group = config_group_get(to_config_group(parent_item));
755 	list_add_tail(&item->ci_entry, &item->ci_group->cg_children);
756 
757 	/*
758 	 * We hold a reference on the child for ci_entry on the parent's
759 	 * cg_children
760 	 */
761 	config_item_get(item);
762 }
763 
764 static void unlink_group(struct config_group *group)
765 {
766 	struct config_group *new_group;
767 
768 	list_for_each_entry(new_group, &group->default_groups, group_entry)
769 		unlink_group(new_group);
770 
771 	group->cg_subsys = NULL;
772 	unlink_obj(&group->cg_item);
773 }
774 
775 static void link_group(struct config_group *parent_group, struct config_group *group)
776 {
777 	struct config_group *new_group;
778 	struct configfs_subsystem *subsys = NULL; /* gcc is a turd */
779 
780 	link_obj(&parent_group->cg_item, &group->cg_item);
781 
782 	if (parent_group->cg_subsys)
783 		subsys = parent_group->cg_subsys;
784 	else if (configfs_is_root(&parent_group->cg_item))
785 		subsys = to_configfs_subsystem(group);
786 	else
787 		BUG();
788 	group->cg_subsys = subsys;
789 
790 	list_for_each_entry(new_group, &group->default_groups, group_entry)
791 		link_group(group, new_group);
792 }
793 
794 /*
795  * The goal is that configfs_attach_item() (and
796  * configfs_attach_group()) can be called from either the VFS or this
797  * module.  That is, they assume that the items have been created,
798  * the dentry allocated, and the dcache is all ready to go.
799  *
800  * If they fail, they must clean up after themselves as if they
801  * had never been called.  The caller (VFS or local function) will
802  * handle cleaning up the dcache bits.
803  *
804  * configfs_detach_group() and configfs_detach_item() behave similarly on
805  * the way out.  They assume that the proper semaphores are held, they
806  * clean up the configfs items, and they expect their callers will
807  * handle the dcache bits.
808  */
809 static int configfs_attach_item(struct config_item *parent_item,
810 				struct config_item *item,
811 				struct dentry *dentry,
812 				struct configfs_fragment *frag)
813 {
814 	int ret;
815 
816 	ret = configfs_create_dir(item, dentry, frag);
817 	if (!ret) {
818 		ret = populate_attrs(item);
819 		if (ret) {
820 			/*
821 			 * We are going to remove an inode and its dentry but
822 			 * the VFS may already have hit and used them. Thus,
823 			 * we must lock them as rmdir() would.
824 			 */
825 			inode_lock(d_inode(dentry));
826 			configfs_remove_dir(item);
827 			d_inode(dentry)->i_flags |= S_DEAD;
828 			dont_mount(dentry);
829 			inode_unlock(d_inode(dentry));
830 			d_delete(dentry);
831 		}
832 	}
833 
834 	return ret;
835 }
836 
837 /* Caller holds the mutex of the item's inode */
838 static void configfs_detach_item(struct config_item *item)
839 {
840 	detach_attrs(item);
841 	configfs_remove_dir(item);
842 }
843 
844 static int configfs_attach_group(struct config_item *parent_item,
845 				 struct config_item *item,
846 				 struct dentry *dentry,
847 				 struct configfs_fragment *frag)
848 {
849 	int ret;
850 	struct configfs_dirent *sd;
851 
852 	ret = configfs_attach_item(parent_item, item, dentry, frag);
853 	if (!ret) {
854 		sd = dentry->d_fsdata;
855 		sd->s_type |= CONFIGFS_USET_DIR;
856 
857 		/*
858 		 * FYI, we're faking mkdir in populate_groups()
859 		 * We must lock the group's inode to avoid races with the VFS
860 		 * which can already hit the inode and try to add/remove entries
861 		 * under it.
862 		 *
863 		 * We must also lock the inode to remove it safely in case of
864 		 * error, as rmdir() would.
865 		 */
866 		inode_lock_nested(d_inode(dentry), I_MUTEX_CHILD);
867 		configfs_adjust_dir_dirent_depth_before_populate(sd);
868 		ret = populate_groups(to_config_group(item), frag);
869 		if (ret) {
870 			configfs_detach_item(item);
871 			d_inode(dentry)->i_flags |= S_DEAD;
872 			dont_mount(dentry);
873 		}
874 		configfs_adjust_dir_dirent_depth_after_populate(sd);
875 		inode_unlock(d_inode(dentry));
876 		if (ret)
877 			d_delete(dentry);
878 	}
879 
880 	return ret;
881 }
882 
883 /* Caller holds the mutex of the group's inode */
884 static void configfs_detach_group(struct config_item *item)
885 {
886 	detach_groups(to_config_group(item));
887 	configfs_detach_item(item);
888 }
889 
890 /*
891  * After the item has been detached from the filesystem view, we are
892  * ready to tear it out of the hierarchy.  Notify the client before
893  * we do that so they can perform any cleanup that requires
894  * navigating the hierarchy.  A client does not need to provide this
895  * callback.  The subsystem semaphore MUST be held by the caller, and
896  * references must be valid for both items.  It also assumes the
897  * caller has validated ci_type.
898  */
899 static void client_disconnect_notify(struct config_item *parent_item,
900 				     struct config_item *item)
901 {
902 	const struct config_item_type *type;
903 
904 	type = parent_item->ci_type;
905 	BUG_ON(!type);
906 
907 	if (type->ct_group_ops && type->ct_group_ops->disconnect_notify)
908 		type->ct_group_ops->disconnect_notify(to_config_group(parent_item),
909 						      item);
910 }
911 
912 /*
913  * Drop the initial reference from make_item()/make_group()
914  * This function assumes that reference is held on item
915  * and that item holds a valid reference to the parent.  Also, it
916  * assumes the caller has validated ci_type.
917  */
918 static void client_drop_item(struct config_item *parent_item,
919 			     struct config_item *item)
920 {
921 	const struct config_item_type *type;
922 
923 	type = parent_item->ci_type;
924 	BUG_ON(!type);
925 
926 	/*
927 	 * If ->drop_item() exists, it is responsible for the
928 	 * config_item_put().
929 	 */
930 	if (type->ct_group_ops && type->ct_group_ops->drop_item)
931 		type->ct_group_ops->drop_item(to_config_group(parent_item),
932 					      item);
933 	else
934 		config_item_put(item);
935 }
936 
937 #ifdef DEBUG
938 static void configfs_dump_one(struct configfs_dirent *sd, int level)
939 {
940 	pr_info("%*s\"%s\":\n", level, " ", configfs_get_name(sd));
941 
942 #define type_print(_type) if (sd->s_type & _type) pr_info("%*s %s\n", level, " ", #_type);
943 	type_print(CONFIGFS_ROOT);
944 	type_print(CONFIGFS_DIR);
945 	type_print(CONFIGFS_ITEM_ATTR);
946 	type_print(CONFIGFS_ITEM_LINK);
947 	type_print(CONFIGFS_USET_DIR);
948 	type_print(CONFIGFS_USET_DEFAULT);
949 	type_print(CONFIGFS_USET_DROPPING);
950 #undef type_print
951 }
952 
953 static int configfs_dump(struct configfs_dirent *sd, int level)
954 {
955 	struct configfs_dirent *child_sd;
956 	int ret = 0;
957 
958 	configfs_dump_one(sd, level);
959 
960 	if (!(sd->s_type & (CONFIGFS_DIR|CONFIGFS_ROOT)))
961 		return 0;
962 
963 	list_for_each_entry(child_sd, &sd->s_children, s_sibling) {
964 		ret = configfs_dump(child_sd, level + 2);
965 		if (ret)
966 			break;
967 	}
968 
969 	return ret;
970 }
971 #endif
972 
973 
974 /*
975  * configfs_depend_item() and configfs_undepend_item()
976  *
977  * WARNING: Do not call these from a configfs callback!
978  *
979  * This describes these functions and their helpers.
980  *
981  * Allow another kernel system to depend on a config_item.  If this
982  * happens, the item cannot go away until the dependent can live without
983  * it.  The idea is to give client modules as simple an interface as
984  * possible.  When a system asks them to depend on an item, they just
985  * call configfs_depend_item().  If the item is live and the client
986  * driver is in good shape, we'll happily do the work for them.
987  *
988  * Why is the locking complex?  Because configfs uses the VFS to handle
989  * all locking, but this function is called outside the normal
990  * VFS->configfs path.  So it must take VFS locks to prevent the
991  * VFS->configfs stuff (configfs_mkdir(), configfs_rmdir(), etc).  This is
992  * why you can't call these functions underneath configfs callbacks.
993  *
994  * Note, btw, that this can be called at *any* time, even when a configfs
995  * subsystem isn't registered, or when configfs is loading or unloading.
996  * Just like configfs_register_subsystem().  So we take the same
997  * precautions.  We pin the filesystem.  We lock configfs_dirent_lock.
998  * If we can find the target item in the
999  * configfs tree, it must be part of the subsystem tree as well, so we
1000  * do not need the subsystem semaphore.  Holding configfs_dirent_lock helps
1001  * locking out mkdir() and rmdir(), who might be racing us.
1002  */
1003 
1004 /*
1005  * configfs_depend_prep()
1006  *
1007  * Only subdirectories count here.  Files (CONFIGFS_NOT_PINNED) are
1008  * attributes.  This is similar but not the same to configfs_detach_prep().
1009  * Note that configfs_detach_prep() expects the parent to be locked when it
1010  * is called, but we lock the parent *inside* configfs_depend_prep().  We
1011  * do that so we can unlock it if we find nothing.
1012  *
1013  * Here we do a depth-first search of the dentry hierarchy looking for
1014  * our object.
1015  * We deliberately ignore items tagged as dropping since they are virtually
1016  * dead, as well as items in the middle of attachment since they virtually
1017  * do not exist yet. This completes the locking out of racing mkdir() and
1018  * rmdir().
1019  * Note: subdirectories in the middle of attachment start with s_type =
1020  * CONFIGFS_DIR|CONFIGFS_USET_CREATING set by create_dir().  When
1021  * CONFIGFS_USET_CREATING is set, we ignore the item.  The actual set of
1022  * s_type is in configfs_new_dirent(), which has configfs_dirent_lock.
1023  *
1024  * If the target is not found, -ENOENT is bubbled up.
1025  *
1026  * This adds a requirement that all config_items be unique!
1027  *
1028  * This is recursive.  There isn't
1029  * much on the stack, though, so folks that need this function - be careful
1030  * about your stack!  Patches will be accepted to make it iterative.
1031  */
1032 static int configfs_depend_prep(struct dentry *origin,
1033 				struct config_item *target)
1034 {
1035 	struct configfs_dirent *child_sd, *sd;
1036 	int ret = 0;
1037 
1038 	BUG_ON(!origin || !origin->d_fsdata);
1039 	sd = origin->d_fsdata;
1040 
1041 	if (sd->s_element == target)  /* Boo-yah */
1042 		goto out;
1043 
1044 	list_for_each_entry(child_sd, &sd->s_children, s_sibling) {
1045 		if ((child_sd->s_type & CONFIGFS_DIR) &&
1046 		    !(child_sd->s_type & CONFIGFS_USET_DROPPING) &&
1047 		    !(child_sd->s_type & CONFIGFS_USET_CREATING)) {
1048 			ret = configfs_depend_prep(child_sd->s_dentry,
1049 						   target);
1050 			if (!ret)
1051 				goto out;  /* Child path boo-yah */
1052 		}
1053 	}
1054 
1055 	/* We looped all our children and didn't find target */
1056 	ret = -ENOENT;
1057 
1058 out:
1059 	return ret;
1060 }
1061 
1062 static int configfs_do_depend_item(struct dentry *subsys_dentry,
1063 				   struct config_item *target)
1064 {
1065 	struct configfs_dirent *p;
1066 	int ret;
1067 
1068 	spin_lock(&configfs_dirent_lock);
1069 	/* Scan the tree, return 0 if found */
1070 	ret = configfs_depend_prep(subsys_dentry, target);
1071 	if (ret)
1072 		goto out_unlock_dirent_lock;
1073 
1074 	/*
1075 	 * We are sure that the item is not about to be removed by rmdir(), and
1076 	 * not in the middle of attachment by mkdir().
1077 	 */
1078 	p = target->ci_dentry->d_fsdata;
1079 	p->s_dependent_count += 1;
1080 
1081 out_unlock_dirent_lock:
1082 	spin_unlock(&configfs_dirent_lock);
1083 
1084 	return ret;
1085 }
1086 
1087 static inline struct configfs_dirent *
1088 configfs_find_subsys_dentry(struct configfs_dirent *root_sd,
1089 			    struct config_item *subsys_item)
1090 {
1091 	struct configfs_dirent *p;
1092 	struct configfs_dirent *ret = NULL;
1093 
1094 	list_for_each_entry(p, &root_sd->s_children, s_sibling) {
1095 		if (p->s_type & CONFIGFS_DIR &&
1096 		    p->s_element == subsys_item) {
1097 			ret = p;
1098 			break;
1099 		}
1100 	}
1101 
1102 	return ret;
1103 }
1104 
1105 
1106 int configfs_depend_item(struct configfs_subsystem *subsys,
1107 			 struct config_item *target)
1108 {
1109 	int ret;
1110 	struct configfs_dirent *subsys_sd;
1111 	struct config_item *s_item = &subsys->su_group.cg_item;
1112 	struct dentry *root;
1113 
1114 	/*
1115 	 * Pin the configfs filesystem.  This means we can safely access
1116 	 * the root of the configfs filesystem.
1117 	 */
1118 	root = configfs_pin_fs();
1119 	if (IS_ERR(root))
1120 		return PTR_ERR(root);
1121 
1122 	/*
1123 	 * Next, lock the root directory.  We're going to check that the
1124 	 * subsystem is really registered, and so we need to lock out
1125 	 * configfs_[un]register_subsystem().
1126 	 */
1127 	inode_lock(d_inode(root));
1128 
1129 	subsys_sd = configfs_find_subsys_dentry(root->d_fsdata, s_item);
1130 	if (!subsys_sd) {
1131 		ret = -ENOENT;
1132 		goto out_unlock_fs;
1133 	}
1134 
1135 	/* Ok, now we can trust subsys/s_item */
1136 	ret = configfs_do_depend_item(subsys_sd->s_dentry, target);
1137 
1138 out_unlock_fs:
1139 	inode_unlock(d_inode(root));
1140 
1141 	/*
1142 	 * If we succeeded, the fs is pinned via other methods.  If not,
1143 	 * we're done with it anyway.  So release_fs() is always right.
1144 	 */
1145 	configfs_release_fs();
1146 
1147 	return ret;
1148 }
1149 EXPORT_SYMBOL(configfs_depend_item);
1150 
1151 /*
1152  * Release the dependent linkage.  This is much simpler than
1153  * configfs_depend_item() because we know that the client driver is
1154  * pinned, thus the subsystem is pinned, and therefore configfs is pinned.
1155  */
1156 void configfs_undepend_item(struct config_item *target)
1157 {
1158 	struct configfs_dirent *sd;
1159 
1160 	/*
1161 	 * Since we can trust everything is pinned, we just need
1162 	 * configfs_dirent_lock.
1163 	 */
1164 	spin_lock(&configfs_dirent_lock);
1165 
1166 	sd = target->ci_dentry->d_fsdata;
1167 	BUG_ON(sd->s_dependent_count < 1);
1168 
1169 	sd->s_dependent_count -= 1;
1170 
1171 	/*
1172 	 * After this unlock, we cannot trust the item to stay alive!
1173 	 * DO NOT REFERENCE item after this unlock.
1174 	 */
1175 	spin_unlock(&configfs_dirent_lock);
1176 }
1177 EXPORT_SYMBOL(configfs_undepend_item);
1178 
1179 /*
1180  * caller_subsys is a caller's subsystem not target's. This is used to
1181  * determine if we should lock root and check subsys or not. When we are
1182  * in the same subsystem as our target there is no need to do locking as
1183  * we know that subsys is valid and is not unregistered during this function
1184  * as we are called from callback of one of his children and VFS holds a lock
1185  * on some inode. Otherwise we have to lock our root to  ensure that target's
1186  * subsystem it is not unregistered during this function.
1187  */
1188 int configfs_depend_item_unlocked(struct configfs_subsystem *caller_subsys,
1189 				  struct config_item *target)
1190 {
1191 	struct configfs_subsystem *target_subsys;
1192 	struct config_group *root, *parent;
1193 	struct configfs_dirent *subsys_sd;
1194 	int ret = -ENOENT;
1195 
1196 	/* Disallow this function for configfs root */
1197 	if (configfs_is_root(target))
1198 		return -EINVAL;
1199 
1200 	parent = target->ci_group;
1201 	/*
1202 	 * This may happen when someone is trying to depend root
1203 	 * directory of some subsystem
1204 	 */
1205 	if (configfs_is_root(&parent->cg_item)) {
1206 		target_subsys = to_configfs_subsystem(to_config_group(target));
1207 		root = parent;
1208 	} else {
1209 		target_subsys = parent->cg_subsys;
1210 		/* Find a cofnigfs root as we may need it for locking */
1211 		for (root = parent; !configfs_is_root(&root->cg_item);
1212 		     root = root->cg_item.ci_group)
1213 			;
1214 	}
1215 
1216 	if (target_subsys != caller_subsys) {
1217 		/*
1218 		 * We are in other configfs subsystem, so we have to do
1219 		 * additional locking to prevent other subsystem from being
1220 		 * unregistered
1221 		 */
1222 		inode_lock(d_inode(root->cg_item.ci_dentry));
1223 
1224 		/*
1225 		 * As we are trying to depend item from other subsystem
1226 		 * we have to check if this subsystem is still registered
1227 		 */
1228 		subsys_sd = configfs_find_subsys_dentry(
1229 				root->cg_item.ci_dentry->d_fsdata,
1230 				&target_subsys->su_group.cg_item);
1231 		if (!subsys_sd)
1232 			goto out_root_unlock;
1233 	} else {
1234 		subsys_sd = target_subsys->su_group.cg_item.ci_dentry->d_fsdata;
1235 	}
1236 
1237 	/* Now we can execute core of depend item */
1238 	ret = configfs_do_depend_item(subsys_sd->s_dentry, target);
1239 
1240 	if (target_subsys != caller_subsys)
1241 out_root_unlock:
1242 		/*
1243 		 * We were called from subsystem other than our target so we
1244 		 * took some locks so now it's time to release them
1245 		 */
1246 		inode_unlock(d_inode(root->cg_item.ci_dentry));
1247 
1248 	return ret;
1249 }
1250 EXPORT_SYMBOL(configfs_depend_item_unlocked);
1251 
1252 static int configfs_mkdir(struct user_namespace *mnt_userns, struct inode *dir,
1253 			  struct dentry *dentry, umode_t mode)
1254 {
1255 	int ret = 0;
1256 	int module_got = 0;
1257 	struct config_group *group = NULL;
1258 	struct config_item *item = NULL;
1259 	struct config_item *parent_item;
1260 	struct configfs_subsystem *subsys;
1261 	struct configfs_dirent *sd;
1262 	const struct config_item_type *type;
1263 	struct module *subsys_owner = NULL, *new_item_owner = NULL;
1264 	struct configfs_fragment *frag;
1265 	char *name;
1266 
1267 	sd = dentry->d_parent->d_fsdata;
1268 
1269 	/*
1270 	 * Fake invisibility if dir belongs to a group/default groups hierarchy
1271 	 * being attached
1272 	 */
1273 	if (!configfs_dirent_is_ready(sd)) {
1274 		ret = -ENOENT;
1275 		goto out;
1276 	}
1277 
1278 	if (!(sd->s_type & CONFIGFS_USET_DIR)) {
1279 		ret = -EPERM;
1280 		goto out;
1281 	}
1282 
1283 	frag = new_fragment();
1284 	if (!frag) {
1285 		ret = -ENOMEM;
1286 		goto out;
1287 	}
1288 
1289 	/* Get a working ref for the duration of this function */
1290 	parent_item = configfs_get_config_item(dentry->d_parent);
1291 	type = parent_item->ci_type;
1292 	subsys = to_config_group(parent_item)->cg_subsys;
1293 	BUG_ON(!subsys);
1294 
1295 	if (!type || !type->ct_group_ops ||
1296 	    (!type->ct_group_ops->make_group &&
1297 	     !type->ct_group_ops->make_item)) {
1298 		ret = -EPERM;  /* Lack-of-mkdir returns -EPERM */
1299 		goto out_put;
1300 	}
1301 
1302 	/*
1303 	 * The subsystem may belong to a different module than the item
1304 	 * being created.  We don't want to safely pin the new item but
1305 	 * fail to pin the subsystem it sits under.
1306 	 */
1307 	if (!subsys->su_group.cg_item.ci_type) {
1308 		ret = -EINVAL;
1309 		goto out_put;
1310 	}
1311 	subsys_owner = subsys->su_group.cg_item.ci_type->ct_owner;
1312 	if (!try_module_get(subsys_owner)) {
1313 		ret = -EINVAL;
1314 		goto out_put;
1315 	}
1316 
1317 	name = kmalloc(dentry->d_name.len + 1, GFP_KERNEL);
1318 	if (!name) {
1319 		ret = -ENOMEM;
1320 		goto out_subsys_put;
1321 	}
1322 
1323 	snprintf(name, dentry->d_name.len + 1, "%s", dentry->d_name.name);
1324 
1325 	mutex_lock(&subsys->su_mutex);
1326 	if (type->ct_group_ops->make_group) {
1327 		group = type->ct_group_ops->make_group(to_config_group(parent_item), name);
1328 		if (!group)
1329 			group = ERR_PTR(-ENOMEM);
1330 		if (!IS_ERR(group)) {
1331 			link_group(to_config_group(parent_item), group);
1332 			item = &group->cg_item;
1333 		} else
1334 			ret = PTR_ERR(group);
1335 	} else {
1336 		item = type->ct_group_ops->make_item(to_config_group(parent_item), name);
1337 		if (!item)
1338 			item = ERR_PTR(-ENOMEM);
1339 		if (!IS_ERR(item))
1340 			link_obj(parent_item, item);
1341 		else
1342 			ret = PTR_ERR(item);
1343 	}
1344 	mutex_unlock(&subsys->su_mutex);
1345 
1346 	kfree(name);
1347 	if (ret) {
1348 		/*
1349 		 * If ret != 0, then link_obj() was never called.
1350 		 * There are no extra references to clean up.
1351 		 */
1352 		goto out_subsys_put;
1353 	}
1354 
1355 	/*
1356 	 * link_obj() has been called (via link_group() for groups).
1357 	 * From here on out, errors must clean that up.
1358 	 */
1359 
1360 	type = item->ci_type;
1361 	if (!type) {
1362 		ret = -EINVAL;
1363 		goto out_unlink;
1364 	}
1365 
1366 	new_item_owner = type->ct_owner;
1367 	if (!try_module_get(new_item_owner)) {
1368 		ret = -EINVAL;
1369 		goto out_unlink;
1370 	}
1371 
1372 	/*
1373 	 * I hate doing it this way, but if there is
1374 	 * an error,  module_put() probably should
1375 	 * happen after any cleanup.
1376 	 */
1377 	module_got = 1;
1378 
1379 	/*
1380 	 * Make racing rmdir() fail if it did not tag parent with
1381 	 * CONFIGFS_USET_DROPPING
1382 	 * Note: if CONFIGFS_USET_DROPPING is already set, attach_group() will
1383 	 * fail and let rmdir() terminate correctly
1384 	 */
1385 	spin_lock(&configfs_dirent_lock);
1386 	/* This will make configfs_detach_prep() fail */
1387 	sd->s_type |= CONFIGFS_USET_IN_MKDIR;
1388 	spin_unlock(&configfs_dirent_lock);
1389 
1390 	if (group)
1391 		ret = configfs_attach_group(parent_item, item, dentry, frag);
1392 	else
1393 		ret = configfs_attach_item(parent_item, item, dentry, frag);
1394 
1395 	spin_lock(&configfs_dirent_lock);
1396 	sd->s_type &= ~CONFIGFS_USET_IN_MKDIR;
1397 	if (!ret)
1398 		configfs_dir_set_ready(dentry->d_fsdata);
1399 	spin_unlock(&configfs_dirent_lock);
1400 
1401 out_unlink:
1402 	if (ret) {
1403 		/* Tear down everything we built up */
1404 		mutex_lock(&subsys->su_mutex);
1405 
1406 		client_disconnect_notify(parent_item, item);
1407 		if (group)
1408 			unlink_group(group);
1409 		else
1410 			unlink_obj(item);
1411 		client_drop_item(parent_item, item);
1412 
1413 		mutex_unlock(&subsys->su_mutex);
1414 
1415 		if (module_got)
1416 			module_put(new_item_owner);
1417 	}
1418 
1419 out_subsys_put:
1420 	if (ret)
1421 		module_put(subsys_owner);
1422 
1423 out_put:
1424 	/*
1425 	 * link_obj()/link_group() took a reference from child->parent,
1426 	 * so the parent is safely pinned.  We can drop our working
1427 	 * reference.
1428 	 */
1429 	config_item_put(parent_item);
1430 	put_fragment(frag);
1431 
1432 out:
1433 	return ret;
1434 }
1435 
1436 static int configfs_rmdir(struct inode *dir, struct dentry *dentry)
1437 {
1438 	struct config_item *parent_item;
1439 	struct config_item *item;
1440 	struct configfs_subsystem *subsys;
1441 	struct configfs_dirent *sd;
1442 	struct configfs_fragment *frag;
1443 	struct module *subsys_owner = NULL, *dead_item_owner = NULL;
1444 	int ret;
1445 
1446 	sd = dentry->d_fsdata;
1447 	if (sd->s_type & CONFIGFS_USET_DEFAULT)
1448 		return -EPERM;
1449 
1450 	/* Get a working ref until we have the child */
1451 	parent_item = configfs_get_config_item(dentry->d_parent);
1452 	subsys = to_config_group(parent_item)->cg_subsys;
1453 	BUG_ON(!subsys);
1454 
1455 	if (!parent_item->ci_type) {
1456 		config_item_put(parent_item);
1457 		return -EINVAL;
1458 	}
1459 
1460 	/* configfs_mkdir() shouldn't have allowed this */
1461 	BUG_ON(!subsys->su_group.cg_item.ci_type);
1462 	subsys_owner = subsys->su_group.cg_item.ci_type->ct_owner;
1463 
1464 	/*
1465 	 * Ensure that no racing symlink() will make detach_prep() fail while
1466 	 * the new link is temporarily attached
1467 	 */
1468 	do {
1469 		struct dentry *wait;
1470 
1471 		mutex_lock(&configfs_symlink_mutex);
1472 		spin_lock(&configfs_dirent_lock);
1473 		/*
1474 		 * Here's where we check for dependents.  We're protected by
1475 		 * configfs_dirent_lock.
1476 		 * If no dependent, atomically tag the item as dropping.
1477 		 */
1478 		ret = sd->s_dependent_count ? -EBUSY : 0;
1479 		if (!ret) {
1480 			ret = configfs_detach_prep(dentry, &wait);
1481 			if (ret)
1482 				configfs_detach_rollback(dentry);
1483 		}
1484 		spin_unlock(&configfs_dirent_lock);
1485 		mutex_unlock(&configfs_symlink_mutex);
1486 
1487 		if (ret) {
1488 			if (ret != -EAGAIN) {
1489 				config_item_put(parent_item);
1490 				return ret;
1491 			}
1492 
1493 			/* Wait until the racing operation terminates */
1494 			inode_lock(d_inode(wait));
1495 			inode_unlock(d_inode(wait));
1496 			dput(wait);
1497 		}
1498 	} while (ret == -EAGAIN);
1499 
1500 	frag = sd->s_frag;
1501 	if (down_write_killable(&frag->frag_sem)) {
1502 		spin_lock(&configfs_dirent_lock);
1503 		configfs_detach_rollback(dentry);
1504 		spin_unlock(&configfs_dirent_lock);
1505 		config_item_put(parent_item);
1506 		return -EINTR;
1507 	}
1508 	frag->frag_dead = true;
1509 	up_write(&frag->frag_sem);
1510 
1511 	/* Get a working ref for the duration of this function */
1512 	item = configfs_get_config_item(dentry);
1513 
1514 	/* Drop reference from above, item already holds one. */
1515 	config_item_put(parent_item);
1516 
1517 	if (item->ci_type)
1518 		dead_item_owner = item->ci_type->ct_owner;
1519 
1520 	if (sd->s_type & CONFIGFS_USET_DIR) {
1521 		configfs_detach_group(item);
1522 
1523 		mutex_lock(&subsys->su_mutex);
1524 		client_disconnect_notify(parent_item, item);
1525 		unlink_group(to_config_group(item));
1526 	} else {
1527 		configfs_detach_item(item);
1528 
1529 		mutex_lock(&subsys->su_mutex);
1530 		client_disconnect_notify(parent_item, item);
1531 		unlink_obj(item);
1532 	}
1533 
1534 	client_drop_item(parent_item, item);
1535 	mutex_unlock(&subsys->su_mutex);
1536 
1537 	/* Drop our reference from above */
1538 	config_item_put(item);
1539 
1540 	module_put(dead_item_owner);
1541 	module_put(subsys_owner);
1542 
1543 	return 0;
1544 }
1545 
1546 const struct inode_operations configfs_dir_inode_operations = {
1547 	.mkdir		= configfs_mkdir,
1548 	.rmdir		= configfs_rmdir,
1549 	.symlink	= configfs_symlink,
1550 	.unlink		= configfs_unlink,
1551 	.lookup		= configfs_lookup,
1552 	.setattr	= configfs_setattr,
1553 };
1554 
1555 const struct inode_operations configfs_root_inode_operations = {
1556 	.lookup		= configfs_lookup,
1557 	.setattr	= configfs_setattr,
1558 };
1559 
1560 static int configfs_dir_open(struct inode *inode, struct file *file)
1561 {
1562 	struct dentry * dentry = file->f_path.dentry;
1563 	struct configfs_dirent * parent_sd = dentry->d_fsdata;
1564 	int err;
1565 
1566 	inode_lock(d_inode(dentry));
1567 	/*
1568 	 * Fake invisibility if dir belongs to a group/default groups hierarchy
1569 	 * being attached
1570 	 */
1571 	err = -ENOENT;
1572 	if (configfs_dirent_is_ready(parent_sd)) {
1573 		file->private_data = configfs_new_dirent(parent_sd, NULL, 0, NULL);
1574 		if (IS_ERR(file->private_data))
1575 			err = PTR_ERR(file->private_data);
1576 		else
1577 			err = 0;
1578 	}
1579 	inode_unlock(d_inode(dentry));
1580 
1581 	return err;
1582 }
1583 
1584 static int configfs_dir_close(struct inode *inode, struct file *file)
1585 {
1586 	struct dentry * dentry = file->f_path.dentry;
1587 	struct configfs_dirent * cursor = file->private_data;
1588 
1589 	inode_lock(d_inode(dentry));
1590 	spin_lock(&configfs_dirent_lock);
1591 	list_del_init(&cursor->s_sibling);
1592 	spin_unlock(&configfs_dirent_lock);
1593 	inode_unlock(d_inode(dentry));
1594 
1595 	release_configfs_dirent(cursor);
1596 
1597 	return 0;
1598 }
1599 
1600 /* Relationship between s_mode and the DT_xxx types */
1601 static inline unsigned char dt_type(struct configfs_dirent *sd)
1602 {
1603 	return (sd->s_mode >> 12) & 15;
1604 }
1605 
1606 static int configfs_readdir(struct file *file, struct dir_context *ctx)
1607 {
1608 	struct dentry *dentry = file->f_path.dentry;
1609 	struct super_block *sb = dentry->d_sb;
1610 	struct configfs_dirent * parent_sd = dentry->d_fsdata;
1611 	struct configfs_dirent *cursor = file->private_data;
1612 	struct list_head *p, *q = &cursor->s_sibling;
1613 	ino_t ino = 0;
1614 
1615 	if (!dir_emit_dots(file, ctx))
1616 		return 0;
1617 	spin_lock(&configfs_dirent_lock);
1618 	if (ctx->pos == 2)
1619 		list_move(q, &parent_sd->s_children);
1620 	for (p = q->next; p != &parent_sd->s_children; p = p->next) {
1621 		struct configfs_dirent *next;
1622 		const char *name;
1623 		int len;
1624 		struct inode *inode = NULL;
1625 
1626 		next = list_entry(p, struct configfs_dirent, s_sibling);
1627 		if (!next->s_element)
1628 			continue;
1629 
1630 		/*
1631 		 * We'll have a dentry and an inode for
1632 		 * PINNED items and for open attribute
1633 		 * files.  We lock here to prevent a race
1634 		 * with configfs_d_iput() clearing
1635 		 * s_dentry before calling iput().
1636 		 *
1637 		 * Why do we go to the trouble?  If
1638 		 * someone has an attribute file open,
1639 		 * the inode number should match until
1640 		 * they close it.  Beyond that, we don't
1641 		 * care.
1642 		 */
1643 		dentry = next->s_dentry;
1644 		if (dentry)
1645 			inode = d_inode(dentry);
1646 		if (inode)
1647 			ino = inode->i_ino;
1648 		spin_unlock(&configfs_dirent_lock);
1649 		if (!inode)
1650 			ino = iunique(sb, 2);
1651 
1652 		name = configfs_get_name(next);
1653 		len = strlen(name);
1654 
1655 		if (!dir_emit(ctx, name, len, ino, dt_type(next)))
1656 			return 0;
1657 
1658 		spin_lock(&configfs_dirent_lock);
1659 		list_move(q, p);
1660 		p = q;
1661 		ctx->pos++;
1662 	}
1663 	spin_unlock(&configfs_dirent_lock);
1664 	return 0;
1665 }
1666 
1667 static loff_t configfs_dir_lseek(struct file *file, loff_t offset, int whence)
1668 {
1669 	struct dentry * dentry = file->f_path.dentry;
1670 
1671 	switch (whence) {
1672 		case 1:
1673 			offset += file->f_pos;
1674 			fallthrough;
1675 		case 0:
1676 			if (offset >= 0)
1677 				break;
1678 			fallthrough;
1679 		default:
1680 			return -EINVAL;
1681 	}
1682 	if (offset != file->f_pos) {
1683 		file->f_pos = offset;
1684 		if (file->f_pos >= 2) {
1685 			struct configfs_dirent *sd = dentry->d_fsdata;
1686 			struct configfs_dirent *cursor = file->private_data;
1687 			struct list_head *p;
1688 			loff_t n = file->f_pos - 2;
1689 
1690 			spin_lock(&configfs_dirent_lock);
1691 			list_del(&cursor->s_sibling);
1692 			p = sd->s_children.next;
1693 			while (n && p != &sd->s_children) {
1694 				struct configfs_dirent *next;
1695 				next = list_entry(p, struct configfs_dirent,
1696 						   s_sibling);
1697 				if (next->s_element)
1698 					n--;
1699 				p = p->next;
1700 			}
1701 			list_add_tail(&cursor->s_sibling, p);
1702 			spin_unlock(&configfs_dirent_lock);
1703 		}
1704 	}
1705 	return offset;
1706 }
1707 
1708 const struct file_operations configfs_dir_operations = {
1709 	.open		= configfs_dir_open,
1710 	.release	= configfs_dir_close,
1711 	.llseek		= configfs_dir_lseek,
1712 	.read		= generic_read_dir,
1713 	.iterate_shared	= configfs_readdir,
1714 };
1715 
1716 /**
1717  * configfs_register_group - creates a parent-child relation between two groups
1718  * @parent_group:	parent group
1719  * @group:		child group
1720  *
1721  * link groups, creates dentry for the child and attaches it to the
1722  * parent dentry.
1723  *
1724  * Return: 0 on success, negative errno code on error
1725  */
1726 int configfs_register_group(struct config_group *parent_group,
1727 			    struct config_group *group)
1728 {
1729 	struct configfs_subsystem *subsys = parent_group->cg_subsys;
1730 	struct dentry *parent;
1731 	struct configfs_fragment *frag;
1732 	int ret;
1733 
1734 	frag = new_fragment();
1735 	if (!frag)
1736 		return -ENOMEM;
1737 
1738 	mutex_lock(&subsys->su_mutex);
1739 	link_group(parent_group, group);
1740 	mutex_unlock(&subsys->su_mutex);
1741 
1742 	parent = parent_group->cg_item.ci_dentry;
1743 
1744 	inode_lock_nested(d_inode(parent), I_MUTEX_PARENT);
1745 	ret = create_default_group(parent_group, group, frag);
1746 	if (ret)
1747 		goto err_out;
1748 
1749 	spin_lock(&configfs_dirent_lock);
1750 	configfs_dir_set_ready(group->cg_item.ci_dentry->d_fsdata);
1751 	spin_unlock(&configfs_dirent_lock);
1752 	inode_unlock(d_inode(parent));
1753 	put_fragment(frag);
1754 	return 0;
1755 err_out:
1756 	inode_unlock(d_inode(parent));
1757 	mutex_lock(&subsys->su_mutex);
1758 	unlink_group(group);
1759 	mutex_unlock(&subsys->su_mutex);
1760 	put_fragment(frag);
1761 	return ret;
1762 }
1763 EXPORT_SYMBOL(configfs_register_group);
1764 
1765 /**
1766  * configfs_unregister_group() - unregisters a child group from its parent
1767  * @group: parent group to be unregistered
1768  *
1769  * Undoes configfs_register_group()
1770  */
1771 void configfs_unregister_group(struct config_group *group)
1772 {
1773 	struct configfs_subsystem *subsys = group->cg_subsys;
1774 	struct dentry *dentry = group->cg_item.ci_dentry;
1775 	struct dentry *parent = group->cg_item.ci_parent->ci_dentry;
1776 	struct configfs_dirent *sd = dentry->d_fsdata;
1777 	struct configfs_fragment *frag = sd->s_frag;
1778 
1779 	down_write(&frag->frag_sem);
1780 	frag->frag_dead = true;
1781 	up_write(&frag->frag_sem);
1782 
1783 	inode_lock_nested(d_inode(parent), I_MUTEX_PARENT);
1784 	spin_lock(&configfs_dirent_lock);
1785 	configfs_detach_prep(dentry, NULL);
1786 	spin_unlock(&configfs_dirent_lock);
1787 
1788 	configfs_detach_group(&group->cg_item);
1789 	d_inode(dentry)->i_flags |= S_DEAD;
1790 	dont_mount(dentry);
1791 	d_drop(dentry);
1792 	fsnotify_rmdir(d_inode(parent), dentry);
1793 	inode_unlock(d_inode(parent));
1794 
1795 	dput(dentry);
1796 
1797 	mutex_lock(&subsys->su_mutex);
1798 	unlink_group(group);
1799 	mutex_unlock(&subsys->su_mutex);
1800 }
1801 EXPORT_SYMBOL(configfs_unregister_group);
1802 
1803 /**
1804  * configfs_register_default_group() - allocates and registers a child group
1805  * @parent_group:	parent group
1806  * @name:		child group name
1807  * @item_type:		child item type description
1808  *
1809  * boilerplate to allocate and register a child group with its parent. We need
1810  * kzalloc'ed memory because child's default_group is initially empty.
1811  *
1812  * Return: allocated config group or ERR_PTR() on error
1813  */
1814 struct config_group *
1815 configfs_register_default_group(struct config_group *parent_group,
1816 				const char *name,
1817 				const struct config_item_type *item_type)
1818 {
1819 	int ret;
1820 	struct config_group *group;
1821 
1822 	group = kzalloc(sizeof(*group), GFP_KERNEL);
1823 	if (!group)
1824 		return ERR_PTR(-ENOMEM);
1825 	config_group_init_type_name(group, name, item_type);
1826 
1827 	ret = configfs_register_group(parent_group, group);
1828 	if (ret) {
1829 		kfree(group);
1830 		return ERR_PTR(ret);
1831 	}
1832 	return group;
1833 }
1834 EXPORT_SYMBOL(configfs_register_default_group);
1835 
1836 /**
1837  * configfs_unregister_default_group() - unregisters and frees a child group
1838  * @group:	the group to act on
1839  */
1840 void configfs_unregister_default_group(struct config_group *group)
1841 {
1842 	configfs_unregister_group(group);
1843 	kfree(group);
1844 }
1845 EXPORT_SYMBOL(configfs_unregister_default_group);
1846 
1847 int configfs_register_subsystem(struct configfs_subsystem *subsys)
1848 {
1849 	int err;
1850 	struct config_group *group = &subsys->su_group;
1851 	struct dentry *dentry;
1852 	struct dentry *root;
1853 	struct configfs_dirent *sd;
1854 	struct configfs_fragment *frag;
1855 
1856 	frag = new_fragment();
1857 	if (!frag)
1858 		return -ENOMEM;
1859 
1860 	root = configfs_pin_fs();
1861 	if (IS_ERR(root)) {
1862 		put_fragment(frag);
1863 		return PTR_ERR(root);
1864 	}
1865 
1866 	if (!group->cg_item.ci_name)
1867 		group->cg_item.ci_name = group->cg_item.ci_namebuf;
1868 
1869 	sd = root->d_fsdata;
1870 	mutex_lock(&configfs_subsystem_mutex);
1871 	link_group(to_config_group(sd->s_element), group);
1872 	mutex_unlock(&configfs_subsystem_mutex);
1873 
1874 	inode_lock_nested(d_inode(root), I_MUTEX_PARENT);
1875 
1876 	err = -ENOMEM;
1877 	dentry = d_alloc_name(root, group->cg_item.ci_name);
1878 	if (dentry) {
1879 		d_add(dentry, NULL);
1880 
1881 		err = configfs_attach_group(sd->s_element, &group->cg_item,
1882 					    dentry, frag);
1883 		if (err) {
1884 			BUG_ON(d_inode(dentry));
1885 			d_drop(dentry);
1886 			dput(dentry);
1887 		} else {
1888 			spin_lock(&configfs_dirent_lock);
1889 			configfs_dir_set_ready(dentry->d_fsdata);
1890 			spin_unlock(&configfs_dirent_lock);
1891 		}
1892 	}
1893 
1894 	inode_unlock(d_inode(root));
1895 
1896 	if (err) {
1897 		mutex_lock(&configfs_subsystem_mutex);
1898 		unlink_group(group);
1899 		mutex_unlock(&configfs_subsystem_mutex);
1900 		configfs_release_fs();
1901 	}
1902 	put_fragment(frag);
1903 
1904 	return err;
1905 }
1906 
1907 void configfs_unregister_subsystem(struct configfs_subsystem *subsys)
1908 {
1909 	struct config_group *group = &subsys->su_group;
1910 	struct dentry *dentry = group->cg_item.ci_dentry;
1911 	struct dentry *root = dentry->d_sb->s_root;
1912 	struct configfs_dirent *sd = dentry->d_fsdata;
1913 	struct configfs_fragment *frag = sd->s_frag;
1914 
1915 	if (dentry->d_parent != root) {
1916 		pr_err("Tried to unregister non-subsystem!\n");
1917 		return;
1918 	}
1919 
1920 	down_write(&frag->frag_sem);
1921 	frag->frag_dead = true;
1922 	up_write(&frag->frag_sem);
1923 
1924 	inode_lock_nested(d_inode(root),
1925 			  I_MUTEX_PARENT);
1926 	inode_lock_nested(d_inode(dentry), I_MUTEX_CHILD);
1927 	mutex_lock(&configfs_symlink_mutex);
1928 	spin_lock(&configfs_dirent_lock);
1929 	if (configfs_detach_prep(dentry, NULL)) {
1930 		pr_err("Tried to unregister non-empty subsystem!\n");
1931 	}
1932 	spin_unlock(&configfs_dirent_lock);
1933 	mutex_unlock(&configfs_symlink_mutex);
1934 	configfs_detach_group(&group->cg_item);
1935 	d_inode(dentry)->i_flags |= S_DEAD;
1936 	dont_mount(dentry);
1937 	inode_unlock(d_inode(dentry));
1938 
1939 	d_drop(dentry);
1940 	fsnotify_rmdir(d_inode(root), dentry);
1941 
1942 	inode_unlock(d_inode(root));
1943 
1944 	dput(dentry);
1945 
1946 	mutex_lock(&configfs_subsystem_mutex);
1947 	unlink_group(group);
1948 	mutex_unlock(&configfs_subsystem_mutex);
1949 	configfs_release_fs();
1950 }
1951 
1952 EXPORT_SYMBOL(configfs_register_subsystem);
1953 EXPORT_SYMBOL(configfs_unregister_subsystem);
1954